ojaffe commited on
Commit
58e2e4e
·
verified ·
1 Parent(s): 5a6434e

Upload folder using huggingface_hub

Browse files
Files changed (3) hide show
  1. loss_history.json +15 -201
  2. model.pt +1 -1
  3. train.log +24 -64
loss_history.json CHANGED
@@ -1,233 +1,47 @@
1
  [
2
  {
3
  "epoch": 1,
4
- "phase": "P1",
5
- "loss": 0.152055
6
  },
7
  {
8
  "epoch": 2,
9
- "phase": "P1",
10
- "loss": 0.126681
11
  },
12
  {
13
  "epoch": 3,
14
- "phase": "P1",
15
- "loss": 0.119891
16
  },
17
  {
18
  "epoch": 4,
19
- "phase": "P1",
20
- "loss": 0.114801
21
  },
22
  {
23
  "epoch": 5,
24
- "phase": "P1",
25
- "loss": 0.110611
26
  },
27
  {
28
  "epoch": 6,
29
- "phase": "P1",
30
- "loss": 0.107016
31
  },
32
  {
33
  "epoch": 7,
34
- "phase": "P1",
35
- "loss": 0.103401
36
  },
37
  {
38
  "epoch": 8,
39
- "phase": "P1",
40
- "loss": 0.100012
41
  },
42
  {
43
  "epoch": 9,
44
- "phase": "P1",
45
- "loss": 0.096366
46
  },
47
  {
48
  "epoch": 10,
49
- "phase": "P1",
50
- "loss": 0.09296
51
- },
52
- {
53
- "epoch": 11,
54
- "phase": "P1",
55
- "loss": 0.089986
56
- },
57
- {
58
- "epoch": 12,
59
- "phase": "P1",
60
- "loss": 0.087143
61
- },
62
- {
63
- "epoch": 13,
64
- "phase": "P1",
65
- "loss": 0.08477
66
- },
67
- {
68
- "epoch": 14,
69
- "phase": "P1",
70
- "loss": 0.083114
71
- },
72
- {
73
- "epoch": 15,
74
- "phase": "P1",
75
- "loss": 0.082026
76
- },
77
- {
78
- "epoch": 16,
79
- "phase": "P2",
80
- "loss": 0.122125
81
- },
82
- {
83
- "epoch": 17,
84
- "phase": "P2",
85
- "loss": 0.118517
86
- },
87
- {
88
- "epoch": 18,
89
- "phase": "P2",
90
- "loss": 0.115646
91
- },
92
- {
93
- "epoch": 19,
94
- "phase": "P2",
95
- "loss": 0.170965
96
- },
97
- {
98
- "epoch": 20,
99
- "phase": "P2",
100
- "loss": 0.163493,
101
- "val_ssim": 0.8267
102
- },
103
- {
104
- "epoch": 21,
105
- "phase": "P2",
106
- "loss": 0.159067
107
- },
108
- {
109
- "epoch": 22,
110
- "phase": "P2",
111
- "loss": 0.237583
112
- },
113
- {
114
- "epoch": 23,
115
- "phase": "P2",
116
- "loss": 0.229664
117
- },
118
- {
119
- "epoch": 24,
120
- "phase": "P2",
121
- "loss": 0.221985
122
- },
123
- {
124
- "epoch": 25,
125
- "phase": "P2",
126
- "loss": 0.215313,
127
- "val_ssim": 0.8505
128
- },
129
- {
130
- "epoch": 26,
131
- "phase": "P2",
132
- "loss": 0.208722
133
- },
134
- {
135
- "epoch": 27,
136
- "phase": "P2",
137
- "loss": 0.203962
138
- },
139
- {
140
- "epoch": 28,
141
- "phase": "P2",
142
- "loss": 0.198393
143
- },
144
- {
145
- "epoch": 29,
146
- "phase": "P2",
147
- "loss": 0.194795
148
- },
149
- {
150
- "epoch": 30,
151
- "phase": "P2",
152
- "loss": 0.191285,
153
- "val_ssim": 0.8759
154
- },
155
- {
156
- "epoch": 31,
157
- "phase": "P2",
158
- "loss": 0.187651
159
- },
160
- {
161
- "epoch": 32,
162
- "phase": "P2",
163
- "loss": 0.184686
164
- },
165
- {
166
- "epoch": 33,
167
- "phase": "P2",
168
- "loss": 0.180715
169
- },
170
- {
171
- "epoch": 34,
172
- "phase": "P2",
173
- "loss": 0.176762
174
- },
175
- {
176
- "epoch": 35,
177
- "phase": "P2",
178
- "loss": 0.172307,
179
- "val_ssim": 0.8774
180
- },
181
- {
182
- "epoch": 36,
183
- "phase": "P2",
184
- "loss": 0.167519
185
- },
186
- {
187
- "epoch": 37,
188
- "phase": "P2",
189
- "loss": 0.162766
190
- },
191
- {
192
- "epoch": 38,
193
- "phase": "P2",
194
- "loss": 0.157198
195
- },
196
- {
197
- "epoch": 39,
198
- "phase": "P2",
199
- "loss": 0.152165
200
- },
201
- {
202
- "epoch": 40,
203
- "phase": "P2",
204
- "loss": 0.147043,
205
- "val_ssim": 0.886
206
- },
207
- {
208
- "epoch": 41,
209
- "phase": "P2",
210
- "loss": 0.141957
211
- },
212
- {
213
- "epoch": 42,
214
- "phase": "P2",
215
- "loss": 0.137481
216
- },
217
- {
218
- "epoch": 43,
219
- "phase": "P2",
220
- "loss": 0.133861
221
- },
222
- {
223
- "epoch": 44,
224
- "phase": "P2",
225
- "loss": 0.131363
226
- },
227
- {
228
- "epoch": 45,
229
- "phase": "P2",
230
- "loss": 0.129965,
231
- "val_ssim": 0.888
232
  }
233
  ]
 
1
  [
2
  {
3
  "epoch": 1,
4
+ "loss": 0.093453
 
5
  },
6
  {
7
  "epoch": 2,
8
+ "loss": 0.092451,
9
+ "val_ssim": 0.8883
10
  },
11
  {
12
  "epoch": 3,
13
+ "loss": 0.091656
 
14
  },
15
  {
16
  "epoch": 4,
17
+ "loss": 0.090955,
18
+ "val_ssim": 0.8887
19
  },
20
  {
21
  "epoch": 5,
22
+ "loss": 0.090331
 
23
  },
24
  {
25
  "epoch": 6,
26
+ "loss": 0.089821,
27
+ "val_ssim": 0.8885
28
  },
29
  {
30
  "epoch": 7,
31
+ "loss": 0.089413
 
32
  },
33
  {
34
  "epoch": 8,
35
+ "loss": 0.08911,
36
+ "val_ssim": 0.8883
37
  },
38
  {
39
  "epoch": 9,
40
+ "loss": 0.088879
 
41
  },
42
  {
43
  "epoch": 10,
44
+ "loss": 0.088735,
45
+ "val_ssim": 0.8881
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
46
  }
47
  ]
model.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e930868e7c620774f7f12cd9c2f056032024e50b17bd1405824daa5df80ecb6b
3
  size 12361376
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a42ae34436c3bf75bb101d51446c6a4bb2f36b9bc6cfe1f06ebf301b519c35ad
3
  size 12361376
train.log CHANGED
@@ -1,64 +1,24 @@
1
- [05:19:55] Device: cuda
2
- [05:19:55] Model parameters: 6,169,586, channels=[56, 112, 224]
3
- [05:19:55] Phase 1: Single-step (15 epochs)
4
- [05:19:59] 45108 sequences
5
- [05:20:50] P1 Epoch 1/15 | loss=0.15205
6
- [05:21:41] P1 Epoch 2/15 | loss=0.12668
7
- [05:22:29] P1 Epoch 3/15 | loss=0.11989
8
- [05:23:16] P1 Epoch 4/15 | loss=0.11480
9
- [05:24:08] P1 Epoch 5/15 | loss=0.11061
10
- [05:24:54] P1 Epoch 6/15 | loss=0.10702
11
- [05:25:46] P1 Epoch 7/15 | loss=0.10340
12
- [05:26:37] P1 Epoch 8/15 | loss=0.10001
13
- [05:27:23] P1 Epoch 9/15 | loss=0.09637
14
- [05:28:12] P1 Epoch 10/15 | loss=0.09296
15
- [05:29:02] P1 Epoch 11/15 | loss=0.08999
16
- [05:29:51] P1 Epoch 12/15 | loss=0.08714
17
- [05:30:40] P1 Epoch 13/15 | loss=0.08477
18
- [05:31:30] P1 Epoch 14/15 | loss=0.08311
19
- [05:32:17] P1 Epoch 15/15 | loss=0.08203
20
- [05:32:17] Phase 2: Graduated AR (30 epochs)
21
- [05:34:32] P2 Epoch 1/30 (steps=2) | loss=0.12213 lr=0.000500
22
- [05:36:49] P2 Epoch 2/30 (steps=2) | loss=0.11852 lr=0.000500
23
- [05:38:58] P2 Epoch 3/30 (steps=2) | loss=0.11565 lr=0.000500
24
- [05:44:14] P2 Epoch 4/30 (steps=4) | loss=0.17096 lr=0.000500
25
- [05:49:31] P2 Epoch 5/30 (steps=4) | loss=0.16349 lr=0.000500
26
- [05:50:57] Val SSIM=0.8267 | {'pong': 0.7258, 'sonic': 0.8199, 'pole_position': 0.9343}
27
- [05:50:57] New best! SSIM=0.8267
28
- [05:56:10] P2 Epoch 6/30 (steps=4) | loss=0.15907 lr=0.000500
29
- [06:10:41] P2 Epoch 7/30 (steps=8) | loss=0.23758 lr=0.000500
30
- [06:24:53] P2 Epoch 8/30 (steps=8) | loss=0.22966 lr=0.000500
31
- [06:39:05] P2 Epoch 9/30 (steps=8) | loss=0.22198 lr=0.000500
32
- [06:53:24] P2 Epoch 10/30 (steps=8) | loss=0.21531 lr=0.000500
33
- [06:54:54] Val SSIM=0.8505 | {'pong': 0.7857, 'sonic': 0.8264, 'pole_position': 0.9393}
34
- [06:54:54] New best! SSIM=0.8505
35
- [07:09:06] P2 Epoch 11/30 (steps=8) | loss=0.20872 lr=0.000500
36
- [07:23:28] P2 Epoch 12/30 (steps=8) | loss=0.20396 lr=0.000500
37
- [07:37:46] P2 Epoch 13/30 (steps=8) | loss=0.19839 lr=0.000500
38
- [07:52:00] P2 Epoch 14/30 (steps=8) | loss=0.19479 lr=0.000500
39
- [08:06:23] P2 Epoch 15/30 (steps=8) | loss=0.19129 lr=0.000500
40
- [08:07:46] Val SSIM=0.8759 | {'pong': 0.8609, 'sonic': 0.8246, 'pole_position': 0.9423}
41
- [08:07:46] New best! SSIM=0.8759
42
- [08:22:08] P2 Epoch 16/30 (steps=8) | loss=0.18765 lr=0.000495
43
- [08:36:25] P2 Epoch 17/30 (steps=8) | loss=0.18469 lr=0.000478
44
- [08:50:42] P2 Epoch 18/30 (steps=8) | loss=0.18071 lr=0.000452
45
- [09:04:59] P2 Epoch 19/30 (steps=8) | loss=0.17676 lr=0.000417
46
- [09:19:13] P2 Epoch 20/30 (steps=8) | loss=0.17231 lr=0.000375
47
- [09:20:41] Val SSIM=0.8774 | {'pong': 0.8579, 'sonic': 0.8323, 'pole_position': 0.9419}
48
- [09:20:41] New best! SSIM=0.8774
49
- [09:35:11] P2 Epoch 21/30 (steps=8) | loss=0.16752 lr=0.000327
50
- [09:49:35] P2 Epoch 22/30 (steps=8) | loss=0.16277 lr=0.000276
51
- [10:03:57] P2 Epoch 23/30 (steps=8) | loss=0.15720 lr=0.000224
52
- [10:18:08] P2 Epoch 24/30 (steps=8) | loss=0.15217 lr=0.000173
53
- [10:32:53] P2 Epoch 25/30 (steps=8) | loss=0.14704 lr=0.000125
54
- [10:34:17] Val SSIM=0.8860 | {'pong': 0.876, 'sonic': 0.8357, 'pole_position': 0.9463}
55
- [10:34:17] New best! SSIM=0.8860
56
- [10:49:35] P2 Epoch 26/30 (steps=8) | loss=0.14196 lr=0.000083
57
- [11:04:55] P2 Epoch 27/30 (steps=8) | loss=0.13748 lr=0.000048
58
- [11:20:12] P2 Epoch 28/30 (steps=8) | loss=0.13386 lr=0.000022
59
- [11:35:30] P2 Epoch 29/30 (steps=8) | loss=0.13136 lr=0.000010
60
- [11:49:54] P2 Epoch 30/30 (steps=8) | loss=0.12997 lr=0.000010
61
- [11:51:09] Val SSIM=0.8880 | {'pong': 0.8813, 'sonic': 0.8349, 'pole_position': 0.9479}
62
- [11:51:09] New best! SSIM=0.8880
63
- [11:51:09] Experiment dir: 12.4 MB
64
- [11:51:09] Training complete. Best val SSIM: 0.8880
 
1
+ [12:02:26] Device: cuda
2
+ [12:02:27] Loaded v10 weights from /home/coder/experiments/2026-04-14-080000-multiscale-flow-v10
3
+ [12:02:27] Model parameters: 6,169,586, channels=[56, 112, 224]
4
+ [12:02:27] Fine-tune: 10 epochs of 8-step AR with pure SSIM loss
5
+ [12:02:31] 43855 sequences
6
+ [12:15:01] Epoch 1/10 | loss=0.09345 lr=0.0000098
7
+ [12:27:32] Epoch 2/10 | loss=0.09245 lr=0.0000091
8
+ [12:29:02] Val SSIM=0.8883 | {'pong': 0.8811, 'sonic': 0.8354, 'pole_position': 0.9485}
9
+ [12:29:02] New best! SSIM=0.8883
10
+ [12:41:38] Epoch 3/10 | loss=0.09166 lr=0.0000081
11
+ [12:54:16] Epoch 4/10 | loss=0.09095 lr=0.0000069
12
+ [12:55:36] Val SSIM=0.8887 | {'pong': 0.8824, 'sonic': 0.8352, 'pole_position': 0.9486}
13
+ [12:55:36] New best! SSIM=0.8887
14
+ [13:08:12] Epoch 5/10 | loss=0.09033 lr=0.0000055
15
+ [13:20:56] Epoch 6/10 | loss=0.08982 lr=0.0000041
16
+ [13:22:21] Val SSIM=0.8885 | {'pong': 0.8824, 'sonic': 0.8347, 'pole_position': 0.9483}
17
+ [13:35:14] Epoch 7/10 | loss=0.08941 lr=0.0000029
18
+ [13:48:14] Epoch 8/10 | loss=0.08911 lr=0.0000019
19
+ [13:49:31] Val SSIM=0.8883 | {'pong': 0.8822, 'sonic': 0.8344, 'pole_position': 0.9484}
20
+ [14:02:17] Epoch 9/10 | loss=0.08888 lr=0.0000012
21
+ [14:14:47] Epoch 10/10 | loss=0.08874 lr=0.0000010
22
+ [14:16:07] Val SSIM=0.8881 | {'pong': 0.8815, 'sonic': 0.8343, 'pole_position': 0.9485}
23
+ [14:16:07] Experiment dir: 12.4 MB
24
+ [14:16:07] Training complete. Best val SSIM: 0.8887