han1823123123 committed on
Commit
4892b74
·
verified ·
1 Parent(s): d0a5835

agent=agent_hammer train_key=07e46d901a3791c0

Browse files
07e46d901a3791c0/config.json ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "act_cache_key": "053e9f2dbd2d3aae",
3
+ "agent": "agent_hammer",
4
+ "arch": "stacked_sae",
5
+ "arch_version": "1.0.0",
6
+ "datasource": "toy_coupled_noisy_K10_M20_d256_pB05_np10_rho06",
7
+ "saved_ts": "2026-05-07T01:23:03Z",
8
+ "seed": 2,
9
+ "train_key": "07e46d901a3791c0",
10
+ "training_cfg": {
11
+ "arch_hparams_override": {
12
+ "T": 2,
13
+ "d_sae": 40,
14
+ "k_pos": 2
15
+ },
16
+ "batch_size": 1024,
17
+ "bricken_enabled": false,
18
+ "bricken_max_resample_fraction": 0.5,
19
+ "bricken_min_fires": 1,
20
+ "bricken_n_check": 2048,
21
+ "bricken_resample_every": 500,
22
+ "dead_threshold_tokens": 10000000,
23
+ "ema_auxk_alpha": 0.03125,
24
+ "learning_rate": 0.0003,
25
+ "n_steps": 8000,
26
+ "optimizer": "adam",
27
+ "plateau_early_stop": false,
28
+ "plateau_min_delta": 0.0001,
29
+ "plateau_patience": 5000,
30
+ "precision": "bf16",
31
+ "train_window_size": null,
32
+ "warmup_steps": 1000
33
+ }
34
+ }
07e46d901a3791c0/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e82163e1812620517a42fe2b77a45f2666f79ee6df884f945f424bc57e838e28
3
+ size 166824