hchcsuim commited on
Commit
0b4a7f1
·
verified ·
1 Parent(s): f48f3c3

Training in progress, epoch 0

Browse files
all_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 0.9975308641975309,
3
+ "total_flos": 3.213382256091464e+17,
4
+ "train_loss": 0.14779486708195494,
5
+ "train_runtime": 540.311,
6
+ "train_samples_per_second": 23.964,
7
+ "train_steps_per_second": 0.374
8
+ }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a3bad6f8ccc3f531e7fff91e3b9659a09d0e56bd625f896f719b0a1a7b090da6
3
  size 110342832
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33d73e513a17019b6e3757a7f5726b25ef57b79541aaa6c931f78c49bed48634
3
  size 110342832
runs/Jun25_14-15-41_IISC144/events.out.tfevents.1719296148.IISC144.10548.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d57d68afe5f1979de1b986ab2af7a48006724df4769d2125b8ba085fe7a014c
3
+ size 10336
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 0.9975308641975309,
3
+ "total_flos": 3.213382256091464e+17,
4
+ "train_loss": 0.14779486708195494,
5
+ "train_runtime": 540.311,
6
+ "train_samples_per_second": 23.964,
7
+ "train_steps_per_second": 0.374
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,195 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.9983008958912574,
3
+ "best_model_checkpoint": "batch-size16_Celeb-DF_opencv-1FPS_faces-expand0-aligned_unaugmentation\\checkpoint-202",
4
+ "epoch": 0.9975308641975309,
5
+ "eval_steps": 500,
6
+ "global_step": 202,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.04938271604938271,
13
+ "grad_norm": 2.2081010341644287,
14
+ "learning_rate": 2.380952380952381e-05,
15
+ "loss": 0.5797,
16
+ "step": 10
17
+ },
18
+ {
19
+ "epoch": 0.09876543209876543,
20
+ "grad_norm": 1.9404168128967285,
21
+ "learning_rate": 4.761904761904762e-05,
22
+ "loss": 0.4365,
23
+ "step": 20
24
+ },
25
+ {
26
+ "epoch": 0.14814814814814814,
27
+ "grad_norm": 4.0794453620910645,
28
+ "learning_rate": 4.751381215469613e-05,
29
+ "loss": 0.4103,
30
+ "step": 30
31
+ },
32
+ {
33
+ "epoch": 0.19753086419753085,
34
+ "grad_norm": 24.15789794921875,
35
+ "learning_rate": 4.475138121546962e-05,
36
+ "loss": 0.3143,
37
+ "step": 40
38
+ },
39
+ {
40
+ "epoch": 0.24691358024691357,
41
+ "grad_norm": 7.551469326019287,
42
+ "learning_rate": 4.1988950276243096e-05,
43
+ "loss": 0.185,
44
+ "step": 50
45
+ },
46
+ {
47
+ "epoch": 0.2962962962962963,
48
+ "grad_norm": 13.123407363891602,
49
+ "learning_rate": 3.9226519337016574e-05,
50
+ "loss": 0.1535,
51
+ "step": 60
52
+ },
53
+ {
54
+ "epoch": 0.345679012345679,
55
+ "grad_norm": 53.75169372558594,
56
+ "learning_rate": 3.646408839779006e-05,
57
+ "loss": 0.2063,
58
+ "step": 70
59
+ },
60
+ {
61
+ "epoch": 0.3950617283950617,
62
+ "grad_norm": 5.172009468078613,
63
+ "learning_rate": 3.370165745856354e-05,
64
+ "loss": 0.113,
65
+ "step": 80
66
+ },
67
+ {
68
+ "epoch": 0.4444444444444444,
69
+ "grad_norm": 6.01790714263916,
70
+ "learning_rate": 3.0939226519337016e-05,
71
+ "loss": 0.0534,
72
+ "step": 90
73
+ },
74
+ {
75
+ "epoch": 0.49382716049382713,
76
+ "grad_norm": 3.071531295776367,
77
+ "learning_rate": 2.8176795580110498e-05,
78
+ "loss": 0.063,
79
+ "step": 100
80
+ },
81
+ {
82
+ "epoch": 0.5432098765432098,
83
+ "grad_norm": 12.023387908935547,
84
+ "learning_rate": 2.541436464088398e-05,
85
+ "loss": 0.0826,
86
+ "step": 110
87
+ },
88
+ {
89
+ "epoch": 0.5925925925925926,
90
+ "grad_norm": 7.534938335418701,
91
+ "learning_rate": 2.265193370165746e-05,
92
+ "loss": 0.0631,
93
+ "step": 120
94
+ },
95
+ {
96
+ "epoch": 0.6419753086419753,
97
+ "grad_norm": 1.6553133726119995,
98
+ "learning_rate": 1.988950276243094e-05,
99
+ "loss": 0.0531,
100
+ "step": 130
101
+ },
102
+ {
103
+ "epoch": 0.691358024691358,
104
+ "grad_norm": 14.167679786682129,
105
+ "learning_rate": 1.712707182320442e-05,
106
+ "loss": 0.0559,
107
+ "step": 140
108
+ },
109
+ {
110
+ "epoch": 0.7407407407407407,
111
+ "grad_norm": 2.242429494857788,
112
+ "learning_rate": 1.4364640883977901e-05,
113
+ "loss": 0.0454,
114
+ "step": 150
115
+ },
116
+ {
117
+ "epoch": 0.7901234567901234,
118
+ "grad_norm": 4.238832950592041,
119
+ "learning_rate": 1.1602209944751381e-05,
120
+ "loss": 0.0468,
121
+ "step": 160
122
+ },
123
+ {
124
+ "epoch": 0.8395061728395061,
125
+ "grad_norm": 2.1989619731903076,
126
+ "learning_rate": 8.839779005524863e-06,
127
+ "loss": 0.0289,
128
+ "step": 170
129
+ },
130
+ {
131
+ "epoch": 0.8888888888888888,
132
+ "grad_norm": 13.035294532775879,
133
+ "learning_rate": 6.077348066298343e-06,
134
+ "loss": 0.0394,
135
+ "step": 180
136
+ },
137
+ {
138
+ "epoch": 0.9382716049382716,
139
+ "grad_norm": 9.14392375946045,
140
+ "learning_rate": 3.314917127071823e-06,
141
+ "loss": 0.0332,
142
+ "step": 190
143
+ },
144
+ {
145
+ "epoch": 0.9876543209876543,
146
+ "grad_norm": 2.9875118732452393,
147
+ "learning_rate": 5.524861878453039e-07,
148
+ "loss": 0.0172,
149
+ "step": 200
150
+ },
151
+ {
152
+ "epoch": 0.9975308641975309,
153
+ "eval_accuracy": 0.9983008958912574,
154
+ "eval_f1": 0.9989828000739782,
155
+ "eval_loss": 0.005187882110476494,
156
+ "eval_precision": 1.0,
157
+ "eval_recall": 0.9979676674364896,
158
+ "eval_roc_auc": 0.9999986075741439,
159
+ "eval_runtime": 224.8904,
160
+ "eval_samples_per_second": 57.575,
161
+ "eval_steps_per_second": 3.602,
162
+ "step": 202
163
+ },
164
+ {
165
+ "epoch": 0.9975308641975309,
166
+ "step": 202,
167
+ "total_flos": 3.213382256091464e+17,
168
+ "train_loss": 0.14779486708195494,
169
+ "train_runtime": 540.311,
170
+ "train_samples_per_second": 23.964,
171
+ "train_steps_per_second": 0.374
172
+ }
173
+ ],
174
+ "logging_steps": 10,
175
+ "max_steps": 202,
176
+ "num_input_tokens_seen": 0,
177
+ "num_train_epochs": 1,
178
+ "save_steps": 500,
179
+ "stateful_callbacks": {
180
+ "TrainerControl": {
181
+ "args": {
182
+ "should_epoch_stop": false,
183
+ "should_evaluate": false,
184
+ "should_log": false,
185
+ "should_save": true,
186
+ "should_training_stop": true
187
+ },
188
+ "attributes": {}
189
+ }
190
+ },
191
+ "total_flos": 3.213382256091464e+17,
192
+ "train_batch_size": 16,
193
+ "trial_name": null,
194
+ "trial_params": null
195
+ }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b8e70a7aef3a9a126a7fedc32060aba03ca008450465ae3ad90d9a326e109c76
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86f481145c09d2b88147c78feab5df8c3d58df1b825f92f801a437de7c4df2b3
3
  size 5240