| { | |
| "model": "adhd", | |
| "layer": 2, | |
| "d_sae": 4096, | |
| "k": 40, | |
| "normalize_activations": "expected_average_only_in", | |
| "n_tokens": 10000000, | |
| "batch_size": 4096, | |
| "lr": 0.0003, | |
| "final_training": { | |
| "step": 2441, | |
| "loss": 7.990331649780273, | |
| "l0": 40.0, | |
| "fve": 0.8937416797380295, | |
| "n_dead": 1, | |
| "mse": 0.015545391477644444 | |
| }, | |
| "dead_pct_heldout": 1.46484375 | |
| } |