han1823123123 commited on
Commit
af7677f
·
verified ·
1 Parent(s): 07f374f

Upload training_logs/txc_bare_antidead_t20__seed1.json with huggingface_hub

Browse files
training_logs/txc_bare_antidead_t20__seed1.json ADDED
@@ -0,0 +1,93 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "loss": [
3
+ 16526.19140625,
4
+ 7570.45849609375,
5
+ 6897.53125,
6
+ 6591.27880859375,
7
+ 6346.61767578125,
8
+ 6263.02685546875,
9
+ 6168.20703125,
10
+ 6103.30322265625,
11
+ 6044.765625,
12
+ 5976.1328125,
13
+ 5997.23583984375,
14
+ 5960.052734375,
15
+ 5950.63037109375,
16
+ 5952.7470703125,
17
+ 5916.24951171875,
18
+ 5864.77734375,
19
+ 5878.50390625
20
+ ],
21
+ "l0": [
22
+ 500.0,
23
+ 497.27099609375,
24
+ 496.361328125,
25
+ 496.6953125,
26
+ 495.693115234375,
27
+ 495.964599609375,
28
+ 495.42138671875,
29
+ 494.422607421875,
30
+ 495.245361328125,
31
+ 493.708740234375,
32
+ 495.469970703125,
33
+ 494.835205078125,
34
+ 495.326904296875,
35
+ 494.803466796875,
36
+ 494.362060546875,
37
+ 493.102294921875,
38
+ 494.330810546875
39
+ ],
40
+ "steps_logged": [
41
+ 0,
42
+ 200,
43
+ 400,
44
+ 600,
45
+ 800,
46
+ 1000,
47
+ 1200,
48
+ 1400,
49
+ 1600,
50
+ 1800,
51
+ 2000,
52
+ 2200,
53
+ 2400,
54
+ 2600,
55
+ 2800,
56
+ 3000,
57
+ 3200
58
+ ],
59
+ "final_step": 3200,
60
+ "converged": true,
61
+ "plateau_last": 0.01723924005125929,
62
+ "elapsed_s": 3668.085907936096,
63
+ "row": 11,
64
+ "arch_id": "txc_bare_antidead_t20",
65
+ "arch": "txc_bare_antidead_t20",
66
+ "group": 2,
67
+ "src_class": "TXCBareAntidead",
68
+ "src_module": "src.architectures.txc_bare_antidead",
69
+ "T": 20,
70
+ "T_max": null,
71
+ "t_sample": null,
72
+ "n_layers": null,
73
+ "k_win": 500,
74
+ "k_pos": 25,
75
+ "shifts": null,
76
+ "alpha": null,
77
+ "gamma": null,
78
+ "n_scales": null,
79
+ "seed": 1,
80
+ "d_in": 2304,
81
+ "d_sae": 18432,
82
+ "subject_model": "google/gemma-2-2b",
83
+ "anchor_layer": 12,
84
+ "mlc_layers": [
85
+ 10,
86
+ 11,
87
+ 12,
88
+ 13,
89
+ 14
90
+ ],
91
+ "phase": "phase7_unification",
92
+ "run_id": "txc_bare_antidead_t20__seed1"
93
+ }