File size: 857 Bytes
50298ab
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
{
  "act_cache_key": "63abe7e716cc7392",
  "agent": "agent_hammer",
  "arch": "tsae_paper",
  "arch_version": "1.0.0",
  "datasource": "toy_coupled_K10_M20_d256",
  "saved_ts": "2026-05-06T22:49:33Z",
  "seed": 2,
  "train_key": "034e68fbf41b8489",
  "training_cfg": {
    "arch_hparams_override": {
      "d_sae": 40,
      "k_pos": 12
    },
    "batch_size": 1024,
    "bricken_enabled": false,
    "bricken_max_resample_fraction": 0.5,
    "bricken_min_fires": 1,
    "bricken_n_check": 2048,
    "bricken_resample_every": 500,
    "dead_threshold_tokens": 10000000,
    "ema_auxk_alpha": 0.03125,
    "learning_rate": 0.0003,
    "n_steps": 30000,
    "optimizer": "adam",
    "plateau_early_stop": false,
    "plateau_min_delta": 0.0001,
    "plateau_patience": 5000,
    "precision": "bf16",
    "train_window_size": 2,
    "warmup_steps": 1000
  }
}