han1823123123 committed on
Commit
cd97af9
·
verified ·
1 Parent(s): 8c64131

agent=agent_em train_key=b300a6a0d26196a6

Browse files
b300a6a0d26196a6/config.json ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "act_cache_key": "e052801ef8e6d22b",
3
+ "agent": "agent_em",
4
+ "arch": "sae_arditi",
5
+ "arch_version": "1.0.0",
6
+ "datasource": "qwen_2_5_14b_instruct_finance_l24_resid_post",
7
+ "saved_ts": "2026-05-04T00:11:25Z",
8
+ "seed": 1,
9
+ "train_key": "b300a6a0d26196a6",
10
+ "training_cfg": {
11
+ "batch_size": 256,
12
+ "bricken_enabled": false,
13
+ "bricken_max_resample_fraction": 0.5,
14
+ "bricken_min_fires": 1,
15
+ "bricken_n_check": 2048,
16
+ "bricken_resample_every": 500,
17
+ "dead_threshold_tokens": 10000000,
18
+ "ema_auxk_alpha": 0.0,
19
+ "learning_rate": 0.0003,
20
+ "n_steps": 30000,
21
+ "optimizer": "adam",
22
+ "plateau_early_stop": false,
23
+ "plateau_min_delta": 0.0001,
24
+ "plateau_patience": 5000,
25
+ "precision": "bf16",
26
+ "warmup_steps": 1000
27
+ }
28
+ }
b300a6a0d26196a6/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afb726521522eeab1572b5b62a58a687bca4202cf040adb8e96d77c1c38330b2
3
+ size 1342329160