nguyenkhoa committed on
Commit
d9c98dd
·
verified ·
1 Parent(s): 4000549

End of training

Browse files
Files changed (3) hide show
  1. all_results.json +5 -5
  2. train_results.json +5 -5
  3. trainer_state.json +280 -80
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 5.0,
3
- "total_flos": 1.9921933677868186e+18,
4
- "train_loss": 0.18438913027445475,
5
- "train_runtime": 4974.1556,
6
- "train_samples_per_second": 80.416,
7
- "train_steps_per_second": 0.106
8
  }
 
1
  {
2
  "epoch": 5.0,
3
+ "total_flos": 3.9844365410304e+18,
4
+ "train_loss": 0.024235197260048972,
5
+ "train_runtime": 18042.9659,
6
+ "train_samples_per_second": 44.339,
7
+ "train_steps_per_second": 0.058
8
  }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 5.0,
3
- "total_flos": 1.9921933677868186e+18,
4
- "train_loss": 0.18438913027445475,
5
- "train_runtime": 4974.1556,
6
- "train_samples_per_second": 80.416,
7
- "train_steps_per_second": 0.106
8
  }
 
1
  {
2
  "epoch": 5.0,
3
+ "total_flos": 3.9844365410304e+18,
4
+ "train_loss": 0.024235197260048972,
5
+ "train_runtime": 18042.9659,
6
+ "train_samples_per_second": 44.339,
7
+ "train_steps_per_second": 0.058
8
  }
trainer_state.json CHANGED
@@ -1,132 +1,332 @@
1
  {
2
- "best_metric": 0.028903182595968246,
3
- "best_model_checkpoint": "./dinov2_Liveness_detection_v2.2.2/checkpoint-512",
4
  "epoch": 5.0,
5
- "eval_steps": 128,
6
- "global_step": 525,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.6095238095238096,
13
- "grad_norm": 31.397323608398438,
14
- "learning_rate": 4.428571428571428e-05,
15
- "loss": 0.8952,
16
  "step": 64
17
  },
18
  {
19
- "epoch": 1.2190476190476192,
20
- "grad_norm": 32.01212692260742,
21
- "learning_rate": 3.8190476190476196e-05,
22
- "loss": 0.266,
 
 
 
 
 
 
 
 
 
 
 
 
23
  "step": 128
24
  },
25
  {
26
- "epoch": 1.2190476190476192,
27
- "eval_accuracy": 0.942,
28
- "eval_f1": 0.9424224282926646,
29
- "eval_loss": 0.1499282419681549,
30
- "eval_precision": 0.9420692134831461,
31
- "eval_recall": 0.942,
32
- "eval_runtime": 220.5479,
33
- "eval_samples_per_second": 90.683,
34
- "eval_steps_per_second": 11.335,
35
  "step": 128
36
  },
37
  {
38
- "epoch": 1.8285714285714287,
39
- "grad_norm": 29.405466079711914,
40
- "learning_rate": 3.2095238095238095e-05,
41
- "loss": 0.1497,
 
 
 
 
 
 
 
 
 
 
 
 
42
  "step": 192
43
  },
44
  {
45
- "epoch": 2.4380952380952383,
46
- "grad_norm": 8.088194847106934,
47
- "learning_rate": 2.6000000000000002e-05,
48
- "loss": 0.0929,
49
  "step": 256
50
  },
51
  {
52
- "epoch": 2.4380952380952383,
53
- "eval_accuracy": 0.95735,
54
- "eval_f1": 0.9578785031500121,
55
- "eval_loss": 0.12672634422779083,
56
- "eval_precision": 0.9593868981160767,
57
- "eval_recall": 0.95735,
58
- "eval_runtime": 209.2644,
59
- "eval_samples_per_second": 95.573,
60
- "eval_steps_per_second": 11.947,
61
  "step": 256
62
  },
63
  {
64
- "epoch": 3.0476190476190474,
65
- "grad_norm": 27.274545669555664,
66
- "learning_rate": 1.9904761904761908e-05,
67
- "loss": 0.0533,
68
  "step": 320
69
  },
70
  {
71
- "epoch": 3.657142857142857,
72
- "grad_norm": 7.902669906616211,
73
- "learning_rate": 1.3809523809523811e-05,
74
- "loss": 0.0298,
 
 
 
 
 
 
 
 
 
 
 
 
75
  "step": 384
76
  },
77
  {
78
- "epoch": 3.657142857142857,
79
- "eval_accuracy": 0.9888,
80
- "eval_f1": 0.9887893352142478,
81
- "eval_loss": 0.030348431318998337,
82
- "eval_precision": 0.9888352116245671,
83
- "eval_recall": 0.9888,
84
- "eval_runtime": 205.3865,
85
- "eval_samples_per_second": 97.377,
86
- "eval_steps_per_second": 12.172,
87
  "step": 384
88
  },
89
  {
90
- "epoch": 4.266666666666667,
91
- "grad_norm": 4.974146366119385,
92
- "learning_rate": 7.714285714285714e-06,
93
- "loss": 0.0159,
 
 
 
 
 
 
 
 
 
 
 
 
94
  "step": 448
95
  },
96
  {
97
- "epoch": 4.876190476190477,
98
- "grad_norm": 9.068910598754883,
99
- "learning_rate": 1.619047619047619e-06,
100
- "loss": 0.0083,
101
  "step": 512
102
  },
103
  {
104
- "epoch": 4.876190476190477,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
105
  "eval_accuracy": 0.99155,
106
- "eval_f1": 0.9915498405407145,
107
- "eval_loss": 0.028903182595968246,
108
- "eval_precision": 0.9915503244910029,
109
  "eval_recall": 0.99155,
110
- "eval_runtime": 209.0101,
111
- "eval_samples_per_second": 95.689,
112
- "eval_steps_per_second": 11.961,
113
- "step": 512
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
114
  },
115
  {
116
  "epoch": 5.0,
117
- "step": 525,
118
- "total_flos": 1.9921933677868186e+18,
119
- "train_loss": 0.18438913027445475,
120
- "train_runtime": 4974.1556,
121
- "train_samples_per_second": 80.416,
122
- "train_steps_per_second": 0.106
123
  }
124
  ],
125
  "logging_steps": 64,
126
- "max_steps": 525,
127
  "num_input_tokens_seen": 0,
128
  "num_train_epochs": 5,
129
- "save_steps": 128,
130
  "stateful_callbacks": {
131
  "TrainerControl": {
132
  "args": {
@@ -139,7 +339,7 @@
139
  "attributes": {}
140
  }
141
  },
142
- "total_flos": 1.9921933677868186e+18,
143
  "train_batch_size": 768,
144
  "trial_name": null,
145
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.021851040422916412,
3
+ "best_model_checkpoint": "./dinov2_Liveness_detection_v2.2.2/checkpoint-960",
4
  "epoch": 5.0,
5
+ "eval_steps": 64,
6
+ "global_step": 1045,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.3062200956937799,
13
+ "grad_norm": 16.814943313598633,
14
+ "learning_rate": 4.6985645933014356e-05,
15
+ "loss": 0.069,
16
  "step": 64
17
  },
18
  {
19
+ "epoch": 0.3062200956937799,
20
+ "eval_accuracy": 0.97885,
21
+ "eval_f1": 0.9789501971935628,
22
+ "eval_loss": 0.05791417136788368,
23
+ "eval_precision": 0.9790213884696916,
24
+ "eval_recall": 0.97885,
25
+ "eval_runtime": 521.502,
26
+ "eval_samples_per_second": 76.702,
27
+ "eval_steps_per_second": 9.588,
28
+ "step": 64
29
+ },
30
+ {
31
+ "epoch": 0.6124401913875598,
32
+ "grad_norm": 11.042802810668945,
33
+ "learning_rate": 4.3923444976076554e-05,
34
+ "loss": 0.0482,
35
  "step": 128
36
  },
37
  {
38
+ "epoch": 0.6124401913875598,
39
+ "eval_accuracy": 0.981375,
40
+ "eval_f1": 0.9814562696359047,
41
+ "eval_loss": 0.05181511119008064,
42
+ "eval_precision": 0.9815262980731044,
43
+ "eval_recall": 0.981375,
44
+ "eval_runtime": 517.0571,
45
+ "eval_samples_per_second": 77.361,
46
+ "eval_steps_per_second": 9.67,
47
  "step": 128
48
  },
49
  {
50
+ "epoch": 0.9186602870813397,
51
+ "grad_norm": 5.2479634284973145,
52
+ "learning_rate": 4.086124401913876e-05,
53
+ "loss": 0.0404,
54
+ "step": 192
55
+ },
56
+ {
57
+ "epoch": 0.9186602870813397,
58
+ "eval_accuracy": 0.9882,
59
+ "eval_f1": 0.9881867637379899,
60
+ "eval_loss": 0.032511744648218155,
61
+ "eval_precision": 0.9882451896307357,
62
+ "eval_recall": 0.9882,
63
+ "eval_runtime": 490.7248,
64
+ "eval_samples_per_second": 81.512,
65
+ "eval_steps_per_second": 10.189,
66
  "step": 192
67
  },
68
  {
69
+ "epoch": 1.2248803827751196,
70
+ "grad_norm": 3.8472037315368652,
71
+ "learning_rate": 3.7799043062200956e-05,
72
+ "loss": 0.0325,
73
  "step": 256
74
  },
75
  {
76
+ "epoch": 1.2248803827751196,
77
+ "eval_accuracy": 0.98545,
78
+ "eval_f1": 0.985494798685368,
79
+ "eval_loss": 0.04072735831141472,
80
+ "eval_precision": 0.9855132158274779,
81
+ "eval_recall": 0.98545,
82
+ "eval_runtime": 466.7395,
83
+ "eval_samples_per_second": 85.701,
84
+ "eval_steps_per_second": 10.713,
85
  "step": 256
86
  },
87
  {
88
+ "epoch": 1.5311004784688995,
89
+ "grad_norm": 4.665475368499756,
90
+ "learning_rate": 3.473684210526316e-05,
91
+ "loss": 0.0322,
92
  "step": 320
93
  },
94
  {
95
+ "epoch": 1.5311004784688995,
96
+ "eval_accuracy": 0.99015,
97
+ "eval_f1": 0.990145076314261,
98
+ "eval_loss": 0.028076525777578354,
99
+ "eval_precision": 0.9901636180839065,
100
+ "eval_recall": 0.99015,
101
+ "eval_runtime": 480.6976,
102
+ "eval_samples_per_second": 83.212,
103
+ "eval_steps_per_second": 10.402,
104
+ "step": 320
105
+ },
106
+ {
107
+ "epoch": 1.8373205741626795,
108
+ "grad_norm": 5.757445335388184,
109
+ "learning_rate": 3.1674641148325365e-05,
110
+ "loss": 0.0283,
111
  "step": 384
112
  },
113
  {
114
+ "epoch": 1.8373205741626795,
115
+ "eval_accuracy": 0.988425,
116
+ "eval_f1": 0.9884000225035877,
117
+ "eval_loss": 0.0346578024327755,
118
+ "eval_precision": 0.9885429088726858,
119
+ "eval_recall": 0.988425,
120
+ "eval_runtime": 483.3989,
121
+ "eval_samples_per_second": 82.747,
122
+ "eval_steps_per_second": 10.343,
123
  "step": 384
124
  },
125
  {
126
+ "epoch": 2.1435406698564594,
127
+ "grad_norm": 2.869988203048706,
128
+ "learning_rate": 2.8612440191387562e-05,
129
+ "loss": 0.0256,
130
+ "step": 448
131
+ },
132
+ {
133
+ "epoch": 2.1435406698564594,
134
+ "eval_accuracy": 0.990725,
135
+ "eval_f1": 0.9907227766051799,
136
+ "eval_loss": 0.027070404961705208,
137
+ "eval_precision": 0.9907303189959034,
138
+ "eval_recall": 0.990725,
139
+ "eval_runtime": 480.102,
140
+ "eval_samples_per_second": 83.316,
141
+ "eval_steps_per_second": 10.414,
142
  "step": 448
143
  },
144
  {
145
+ "epoch": 2.449760765550239,
146
+ "grad_norm": 4.530367374420166,
147
+ "learning_rate": 2.5550239234449763e-05,
148
+ "loss": 0.0207,
149
  "step": 512
150
  },
151
  {
152
+ "epoch": 2.449760765550239,
153
+ "eval_accuracy": 0.987375,
154
+ "eval_f1": 0.9873992902183978,
155
+ "eval_loss": 0.035906460136175156,
156
+ "eval_precision": 0.9873848219691154,
157
+ "eval_recall": 0.987375,
158
+ "eval_runtime": 485.3186,
159
+ "eval_samples_per_second": 82.42,
160
+ "eval_steps_per_second": 10.303,
161
+ "step": 512
162
+ },
163
+ {
164
+ "epoch": 2.7559808612440193,
165
+ "grad_norm": 2.7303965091705322,
166
+ "learning_rate": 2.2488038277511964e-05,
167
+ "loss": 0.0192,
168
+ "step": 576
169
+ },
170
+ {
171
+ "epoch": 2.7559808612440193,
172
+ "eval_accuracy": 0.99165,
173
+ "eval_f1": 0.9916437240635789,
174
+ "eval_loss": 0.025301363319158554,
175
+ "eval_precision": 0.9916710521622637,
176
+ "eval_recall": 0.99165,
177
+ "eval_runtime": 481.2714,
178
+ "eval_samples_per_second": 83.113,
179
+ "eval_steps_per_second": 10.389,
180
+ "step": 576
181
+ },
182
+ {
183
+ "epoch": 3.062200956937799,
184
+ "grad_norm": 2.5271918773651123,
185
+ "learning_rate": 1.9425837320574165e-05,
186
+ "loss": 0.017,
187
+ "step": 640
188
+ },
189
+ {
190
+ "epoch": 3.062200956937799,
191
+ "eval_accuracy": 0.9908,
192
+ "eval_f1": 0.9908068152778651,
193
+ "eval_loss": 0.02719452604651451,
194
+ "eval_precision": 0.9907948609341658,
195
+ "eval_recall": 0.9908,
196
+ "eval_runtime": 486.6359,
197
+ "eval_samples_per_second": 82.197,
198
+ "eval_steps_per_second": 10.275,
199
+ "step": 640
200
+ },
201
+ {
202
+ "epoch": 3.3684210526315788,
203
+ "grad_norm": 3.4637880325317383,
204
+ "learning_rate": 1.6363636363636366e-05,
205
+ "loss": 0.0134,
206
+ "step": 704
207
+ },
208
+ {
209
+ "epoch": 3.3684210526315788,
210
  "eval_accuracy": 0.99155,
211
+ "eval_f1": 0.991553221477779,
212
+ "eval_loss": 0.025475142523646355,
213
+ "eval_precision": 0.9915457922828868,
214
  "eval_recall": 0.99155,
215
+ "eval_runtime": 487.284,
216
+ "eval_samples_per_second": 82.088,
217
+ "eval_steps_per_second": 10.261,
218
+ "step": 704
219
+ },
220
+ {
221
+ "epoch": 3.674641148325359,
222
+ "grad_norm": 2.8516900539398193,
223
+ "learning_rate": 1.3301435406698565e-05,
224
+ "loss": 0.0132,
225
+ "step": 768
226
+ },
227
+ {
228
+ "epoch": 3.674641148325359,
229
+ "eval_accuracy": 0.9925,
230
+ "eval_f1": 0.9924949448411151,
231
+ "eval_loss": 0.023235656321048737,
232
+ "eval_precision": 0.9925169638113596,
233
+ "eval_recall": 0.9925,
234
+ "eval_runtime": 489.1056,
235
+ "eval_samples_per_second": 81.782,
236
+ "eval_steps_per_second": 10.223,
237
+ "step": 768
238
+ },
239
+ {
240
+ "epoch": 3.9808612440191387,
241
+ "grad_norm": 2.9499707221984863,
242
+ "learning_rate": 1.0239234449760766e-05,
243
+ "loss": 0.0114,
244
+ "step": 832
245
+ },
246
+ {
247
+ "epoch": 3.9808612440191387,
248
+ "eval_accuracy": 0.99185,
249
+ "eval_f1": 0.9918568051307793,
250
+ "eval_loss": 0.026025714352726936,
251
+ "eval_precision": 0.9918472125621515,
252
+ "eval_recall": 0.99185,
253
+ "eval_runtime": 486.1176,
254
+ "eval_samples_per_second": 82.285,
255
+ "eval_steps_per_second": 10.286,
256
+ "step": 832
257
+ },
258
+ {
259
+ "epoch": 4.287081339712919,
260
+ "grad_norm": 3.4067459106445312,
261
+ "learning_rate": 7.177033492822967e-06,
262
+ "loss": 0.0074,
263
+ "step": 896
264
+ },
265
+ {
266
+ "epoch": 4.287081339712919,
267
+ "eval_accuracy": 0.992725,
268
+ "eval_f1": 0.9927214337347136,
269
+ "eval_loss": 0.024225549772381783,
270
+ "eval_precision": 0.9927357715365919,
271
+ "eval_recall": 0.992725,
272
+ "eval_runtime": 482.0799,
273
+ "eval_samples_per_second": 82.974,
274
+ "eval_steps_per_second": 10.372,
275
+ "step": 896
276
+ },
277
+ {
278
+ "epoch": 4.5933014354066986,
279
+ "grad_norm": 3.6422884464263916,
280
+ "learning_rate": 4.114832535885168e-06,
281
+ "loss": 0.0079,
282
+ "step": 960
283
+ },
284
+ {
285
+ "epoch": 4.5933014354066986,
286
+ "eval_accuracy": 0.99315,
287
+ "eval_f1": 0.9931459136485375,
288
+ "eval_loss": 0.021851040422916412,
289
+ "eval_precision": 0.9931635536599013,
290
+ "eval_recall": 0.99315,
291
+ "eval_runtime": 488.3316,
292
+ "eval_samples_per_second": 81.912,
293
+ "eval_steps_per_second": 10.239,
294
+ "step": 960
295
+ },
296
+ {
297
+ "epoch": 4.899521531100478,
298
+ "grad_norm": 4.330822467803955,
299
+ "learning_rate": 1.0526315789473685e-06,
300
+ "loss": 0.0072,
301
+ "step": 1024
302
+ },
303
+ {
304
+ "epoch": 4.899521531100478,
305
+ "eval_accuracy": 0.993425,
306
+ "eval_f1": 0.9934216498623175,
307
+ "eval_loss": 0.02193431928753853,
308
+ "eval_precision": 0.9934356337892436,
309
+ "eval_recall": 0.993425,
310
+ "eval_runtime": 492.599,
311
+ "eval_samples_per_second": 81.202,
312
+ "eval_steps_per_second": 10.15,
313
+ "step": 1024
314
  },
315
  {
316
  "epoch": 5.0,
317
+ "step": 1045,
318
+ "total_flos": 3.9844365410304e+18,
319
+ "train_loss": 0.024235197260048972,
320
+ "train_runtime": 18042.9659,
321
+ "train_samples_per_second": 44.339,
322
+ "train_steps_per_second": 0.058
323
  }
324
  ],
325
  "logging_steps": 64,
326
+ "max_steps": 1045,
327
  "num_input_tokens_seen": 0,
328
  "num_train_epochs": 5,
329
+ "save_steps": 64,
330
  "stateful_callbacks": {
331
  "TrainerControl": {
332
  "args": {
 
339
  "attributes": {}
340
  }
341
  },
342
+ "total_flos": 3.9844365410304e+18,
343
  "train_batch_size": 768,
344
  "trial_name": null,
345
  "trial_params": null