| { | |
| "model": "adhd", | |
| "layer": 3, | |
| "d_sae": 4096, | |
| "k": 40, | |
| "normalize_activations": "expected_average_only_in", | |
| "n_tokens": 10000000, | |
| "batch_size": 4096, | |
| "lr": 0.0003, | |
| "final_training": { | |
| "step": 2441, | |
| "loss": 16.80815315246582, | |
| "l0": 40.0, | |
| "fve": 0.8691270860953982, | |
| "n_dead": 0, | |
| "mse": 0.032828424125909805 | |
| }, | |
| "dead_pct_heldout": 2.2216796875 | |
| } |