han1823123123 committed on
Commit
b10f1c0
·
verified ·
1 Parent(s): f97c085

agent=agent_em_100k train_key=468da945c83f2334

Browse files
468da945c83f2334/config.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "act_cache_key": "87b600e76b7ab26d",
3
+ "agent": "agent_em_100k",
4
+ "arch": "mlc",
5
+ "arch_version": "1.0.0",
6
+ "datasource": "gemma_2_2b_base_l11to15_fineweb_24k128",
7
+ "saved_ts": "2026-05-06T10:31:45Z",
8
+ "seed": 2,
9
+ "train_key": "468da945c83f2334",
10
+ "training_cfg": {
11
+ "arch_hparams_override": null,
12
+ "batch_size": 1024,
13
+ "bricken_enabled": false,
14
+ "bricken_max_resample_fraction": 0.5,
15
+ "bricken_min_fires": 1,
16
+ "bricken_n_check": 2048,
17
+ "bricken_resample_every": 500,
18
+ "dead_threshold_tokens": 10000000,
19
+ "ema_auxk_alpha": 0.03125,
20
+ "learning_rate": 0.0003,
21
+ "n_steps": 20000,
22
+ "optimizer": "adam",
23
+ "plateau_early_stop": false,
24
+ "plateau_min_delta": 0.0001,
25
+ "plateau_patience": 5000,
26
+ "precision": "bf16",
27
+ "train_window_size": null,
28
+ "warmup_steps": 1000
29
+ }
30
+ }
468da945c83f2334/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38dcf66a2a704cb00b1a594c51c38a0b729a74566ae8a0e3dde4bd0c5a0c544b
3
+ size 1698813264