han1823123123 commited on
Commit
e8d07d9
·
verified ·
1 Parent(s): 495c04f

Upload training_logs/txc_bare_antidead_t5__seed2.json with huggingface_hub

Browse files
training_logs/txc_bare_antidead_t5__seed2.json ADDED
@@ -0,0 +1,120 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "loss": [
3
+ 18225.08203125,
4
+ 5529.5791015625,
5
+ 4895.27392578125,
6
+ 4545.2705078125,
7
+ 4250.55615234375,
8
+ 4072.169921875,
9
+ 4004.07080078125,
10
+ 3863.221923828125,
11
+ 3780.98291015625,
12
+ 3743.45166015625,
13
+ 3708.831298828125,
14
+ 3641.944580078125,
15
+ 3606.340576171875,
16
+ 3620.38134765625,
17
+ 3587.888427734375,
18
+ 3568.888427734375,
19
+ 3557.522705078125,
20
+ 3519.996826171875,
21
+ 3512.595703125,
22
+ 3483.601318359375,
23
+ 3474.846435546875,
24
+ 3443.065185546875,
25
+ 3454.44384765625,
26
+ 3438.76806640625,
27
+ 3472.262451171875,
28
+ 3455.16015625
29
+ ],
30
+ "l0": [
31
+ 500.0,
32
+ 496.24365234375,
33
+ 496.251220703125,
34
+ 495.40625,
35
+ 493.69140625,
36
+ 493.0595703125,
37
+ 492.3154296875,
38
+ 492.218017578125,
39
+ 491.462890625,
40
+ 491.395263671875,
41
+ 492.19140625,
42
+ 492.17236328125,
43
+ 491.419921875,
44
+ 492.16259765625,
45
+ 491.4326171875,
46
+ 490.93701171875,
47
+ 490.2861328125,
48
+ 491.725341796875,
49
+ 492.156005859375,
50
+ 490.299560546875,
51
+ 490.712890625,
52
+ 490.790283203125,
53
+ 491.512939453125,
54
+ 491.12109375,
55
+ 491.15185546875,
56
+ 492.138427734375
57
+ ],
58
+ "steps_logged": [
59
+ 0,
60
+ 200,
61
+ 400,
62
+ 600,
63
+ 800,
64
+ 1000,
65
+ 1200,
66
+ 1400,
67
+ 1600,
68
+ 1800,
69
+ 2000,
70
+ 2200,
71
+ 2400,
72
+ 2600,
73
+ 2800,
74
+ 3000,
75
+ 3200,
76
+ 3400,
77
+ 3600,
78
+ 3800,
79
+ 4000,
80
+ 4200,
81
+ 4400,
82
+ 4600,
83
+ 4800,
84
+ 5000
85
+ ],
86
+ "final_step": 5000,
87
+ "converged": true,
88
+ "plateau_last": 0.016232855159720415,
89
+ "elapsed_s": 1491.821403503418,
90
+ "row": 9,
91
+ "arch_id": "txc_bare_antidead_t5",
92
+ "arch": "txc_bare_antidead_t5",
93
+ "group": 2,
94
+ "src_class": "TXCBareAntidead",
95
+ "src_module": "src.architectures.txc_bare_antidead",
96
+ "T": 5,
97
+ "T_max": null,
98
+ "t_sample": null,
99
+ "n_layers": null,
100
+ "k_win": 500,
101
+ "k_pos": 100,
102
+ "shifts": null,
103
+ "alpha": null,
104
+ "gamma": null,
105
+ "n_scales": null,
106
+ "seed": 2,
107
+ "d_in": 2304,
108
+ "d_sae": 18432,
109
+ "subject_model": "google/gemma-2-2b",
110
+ "anchor_layer": 12,
111
+ "mlc_layers": [
112
+ 10,
113
+ 11,
114
+ 12,
115
+ 13,
116
+ 14
117
+ ],
118
+ "phase": "phase7_unification",
119
+ "run_id": "txc_bare_antidead_t5__seed2"
120
+ }