| { | |
| "model": "adhd", | |
| "layer": 1, | |
| "d_sae": 4096, | |
| "k": 40, | |
| "normalize_activations": "expected_average_only_in", | |
| "n_tokens": 10000000, | |
| "batch_size": 4096, | |
| "lr": 0.0003, | |
| "final_training": { | |
| "step": 2441, | |
| "loss": 3.830482244491577, | |
| "l0": 40.0, | |
| "fve": 0.9020028367114843, | |
| "n_dead": 5, | |
| "mse": 0.0073381345719099045 | |
| }, | |
| "dead_pct_heldout": 1.3671875 | |
| } |