han1823123123 commited on
Commit
d3ac32d
·
verified ·
1 Parent(s): f39e1c8

Upload training_logs/txcdr_t7__seed2.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. training_logs/txcdr_t7__seed2.json +120 -0
training_logs/txcdr_t7__seed2.json ADDED
@@ -0,0 +1,120 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "loss": [
3
+ 56080.421875,
4
+ 6856.16259765625,
5
+ 6034.1064453125,
6
+ 5598.9052734375,
7
+ 5339.90625,
8
+ 5159.7578125,
9
+ 5041.169921875,
10
+ 4946.669921875,
11
+ 4878.232421875,
12
+ 4772.8173828125,
13
+ 4754.31591796875,
14
+ 4681.7568359375,
15
+ 4623.92138671875,
16
+ 4635.57421875,
17
+ 4600.3046875,
18
+ 4529.744140625,
19
+ 4545.169921875,
20
+ 4494.306640625,
21
+ 4526.4052734375,
22
+ 4510.4169921875,
23
+ 4436.6962890625,
24
+ 4414.267578125,
25
+ 4437.484375,
26
+ 4440.3876953125,
27
+ 4407.373046875,
28
+ 4375.6904296875
29
+ ],
30
+ "l0": [
31
+ 500.0,
32
+ 494.39697265625,
33
+ 494.12109375,
34
+ 494.83154296875,
35
+ 494.172119140625,
36
+ 492.957275390625,
37
+ 492.938232421875,
38
+ 492.335205078125,
39
+ 493.08642578125,
40
+ 492.0126953125,
41
+ 492.73681640625,
42
+ 491.357421875,
43
+ 490.5078125,
44
+ 493.208984375,
45
+ 492.582763671875,
46
+ 492.46728515625,
47
+ 491.911376953125,
48
+ 491.305419921875,
49
+ 493.31103515625,
50
+ 491.4091796875,
51
+ 491.3466796875,
52
+ 490.43603515625,
53
+ 491.9892578125,
54
+ 492.1416015625,
55
+ 490.90771484375,
56
+ 491.515869140625
57
+ ],
58
+ "steps_logged": [
59
+ 0,
60
+ 200,
61
+ 400,
62
+ 600,
63
+ 800,
64
+ 1000,
65
+ 1200,
66
+ 1400,
67
+ 1600,
68
+ 1800,
69
+ 2000,
70
+ 2200,
71
+ 2400,
72
+ 2600,
73
+ 2800,
74
+ 3000,
75
+ 3200,
76
+ 3400,
77
+ 3600,
78
+ 3800,
79
+ 4000,
80
+ 4200,
81
+ 4400,
82
+ 4600,
83
+ 4800,
84
+ 5000
85
+ ],
86
+ "final_step": 5000,
87
+ "converged": true,
88
+ "plateau_last": 0.019446190518349653,
89
+ "elapsed_s": 1393.7411108016968,
90
+ "row": 18,
91
+ "arch_id": "txcdr_t7",
92
+ "arch": "txcdr_t7",
93
+ "group": 3,
94
+ "src_class": "TemporalCrosscoder",
95
+ "src_module": "src.architectures.crosscoder",
96
+ "T": 7,
97
+ "T_max": null,
98
+ "t_sample": null,
99
+ "n_layers": null,
100
+ "k_win": 500,
101
+ "k_pos": 71,
102
+ "shifts": null,
103
+ "alpha": null,
104
+ "gamma": null,
105
+ "n_scales": null,
106
+ "seed": 2,
107
+ "d_in": 2304,
108
+ "d_sae": 18432,
109
+ "subject_model": "google/gemma-2-2b",
110
+ "anchor_layer": 12,
111
+ "mlc_layers": [
112
+ 10,
113
+ 11,
114
+ 12,
115
+ 13,
116
+ 14
117
+ ],
118
+ "phase": "phase7_unification",
119
+ "run_id": "txcdr_t7__seed2"
120
+ }