haeylee commited on
Commit
03f4184
·
verified ·
1 Parent(s): 7603b96
wav2vec2/freeze/02_wav2vec2-large-960-h/all_results.json DELETED
@@ -1,21 +0,0 @@
1
- {
2
- "epoch": 30.0,
3
- "eval_loss": 1.2460167407989502,
4
- "eval_mse_0": 1.4599828720092773,
5
- "eval_mse_1": 1.062279224395752,
6
- "eval_mse_2": 1.073793888092041,
7
- "eval_mse_3": 1.3880120515823364,
8
- "eval_pcc_0": 0.7018509725629924,
9
- "eval_pcc_1": 0.7738516252096618,
10
- "eval_pcc_2": 0.774751106649783,
11
- "eval_pcc_3": 0.7272315825392802,
12
- "eval_runtime": 101.0766,
13
- "eval_samples": 2500,
14
- "eval_samples_per_second": 24.734,
15
- "eval_steps_per_second": 3.097,
16
- "train_loss": 1.2372805285631532,
17
- "train_runtime": 9022.2383,
18
- "train_samples": 2500,
19
- "train_samples_per_second": 8.313,
20
- "train_steps_per_second": 1.041
21
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
wav2vec2/freeze/02_wav2vec2-large-960-h/args.json DELETED
@@ -1,11 +0,0 @@
1
- {
2
- "batch_size": 4,
3
- "model_name": "facebook/wav2vec2-large-960h",
4
- "learning_rate": 1e-05,
5
- "num_train_epochs": 30,
6
- "save_dir": "./cnnfreeze/model_saved",
7
- "freeze_feature_extractor": true,
8
- "exp_name": "facebook/wav2vec2-large-960h_lr1e-05_epochs30_batch4",
9
- "save_dir_path": "./cnnfreeze/model_saved/facebook/wav2vec2-large-960h_lr1e-05_epochs30_batch4",
10
- "save_log_path": "./cnnfreeze/model_saved/logs/facebook/wav2vec2-large-960h_lr1e-05_epochs30_batch4"
11
- }
 
 
 
 
 
 
 
 
 
 
 
 
wav2vec2/freeze/02_wav2vec2-large-960-h/eval_results.json DELETED
@@ -1,16 +0,0 @@
1
- {
2
- "epoch": 30.0,
3
- "eval_loss": 1.2460167407989502,
4
- "eval_mse_0": 1.4599828720092773,
5
- "eval_mse_1": 1.062279224395752,
6
- "eval_mse_2": 1.073793888092041,
7
- "eval_mse_3": 1.3880120515823364,
8
- "eval_pcc_0": 0.7018509725629924,
9
- "eval_pcc_1": 0.7738516252096618,
10
- "eval_pcc_2": 0.774751106649783,
11
- "eval_pcc_3": 0.7272315825392802,
12
- "eval_runtime": 101.0766,
13
- "eval_samples": 2500,
14
- "eval_samples_per_second": 24.734,
15
- "eval_steps_per_second": 3.097
16
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
wav2vec2/freeze/02_wav2vec2-large-960-h/finetuned_pytorch_model.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:a17755e281bc8df110476e18574a87297dd3efe05f9cdf712a40e93c72970831
3
- size 1261896664
 
 
 
 
wav2vec2/freeze/02_wav2vec2-large-960-h/model.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:3797c5338685801534e7124ecb5897d3cd78c006309a982c3a7d73863a0a6288
3
- size 1261781352
 
 
 
 
wav2vec2/freeze/02_wav2vec2-large-960-h/model_weights.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:fe96bed2ee957b4f85f619fbbb2ea524cc9773314cd010f433f7a53baff487fb
3
- size 1261892510
 
 
 
 
wav2vec2/freeze/02_wav2vec2-large-960-h/preprocessor_config.json DELETED
@@ -1,9 +0,0 @@
1
- {
2
- "do_normalize": true,
3
- "feature_extractor_type": "Wav2Vec2FeatureExtractor",
4
- "feature_size": 1,
5
- "padding_side": "right",
6
- "padding_value": 0.0,
7
- "return_attention_mask": false,
8
- "sampling_rate": 16000
9
- }
 
 
 
 
 
 
 
 
 
 
wav2vec2/freeze/02_wav2vec2-large-960-h/train_results.json DELETED
@@ -1,8 +0,0 @@
1
- {
2
- "epoch": 30.0,
3
- "train_loss": 1.2372805285631532,
4
- "train_runtime": 9022.2383,
5
- "train_samples": 2500,
6
- "train_samples_per_second": 8.313,
7
- "train_steps_per_second": 1.041
8
- }
 
 
 
 
 
 
 
 
 
wav2vec2/freeze/02_wav2vec2-large-960-h/trainer_args.json DELETED
@@ -1 +0,0 @@
1
- {"output_dir": "./cnnfreeze/model_saved/facebook/wav2vec2-large-960h_lr1e-05_epochs30_batch4", "overwrite_output_dir": false, "do_train": false, "do_eval": true, "do_predict": false, "evaluation_strategy": "epoch", "prediction_loss_only": false, "per_device_train_batch_size": 4, "per_device_eval_batch_size": 4, "per_gpu_train_batch_size": null, "per_gpu_eval_batch_size": null, "gradient_accumulation_steps": 1, "eval_accumulation_steps": null, "eval_delay": 0, "learning_rate": 1e-05, "weight_decay": 0.0, "adam_beta1": 0.9, "adam_beta2": 0.999, "adam_epsilon": 1e-08, "max_grad_norm": 1.0, "num_train_epochs": 30, "max_steps": -1, "lr_scheduler_type": "linear", "lr_scheduler_kwargs": {}, "warmup_ratio": 0.0, "warmup_steps": 0, "log_level": "info", "log_level_replica": "warning", "log_on_each_node": true, "logging_dir": "./cnnfreeze/model_saved/logs/facebook/wav2vec2-large-960h_lr1e-05_epochs30_batch4", "logging_strategy": "steps", "logging_first_step": false, "logging_steps": 500, "logging_nan_inf_filter": true, "save_strategy": "epoch", "save_steps": 500, "save_total_limit": 3, "save_safetensors": true, "save_on_each_node": false, "save_only_model": false, "no_cuda": false, "use_cpu": false, "use_mps_device": false, "seed": 42, "data_seed": null, "jit_mode_eval": false, "use_ipex": false, "bf16": false, "fp16": false, "fp16_opt_level": "O1", "half_precision_backend": "auto", "bf16_full_eval": false, "fp16_full_eval": false, "tf32": null, "local_rank": 0, "ddp_backend": null, "tpu_num_cores": null, "tpu_metrics_debug": false, "debug": [], "dataloader_drop_last": false, "eval_steps": null, "dataloader_num_workers": 0, "past_index": -1, "run_name": "./cnnfreeze/model_saved/facebook/wav2vec2-large-960h_lr1e-05_epochs30_batch4", "disable_tqdm": false, "remove_unused_columns": true, "label_names": null, "load_best_model_at_end": false, "metric_for_best_model": null, "greater_is_better": null, "ignore_data_skip": false, "fsdp": [], "fsdp_min_num_params": 0, "fsdp_config": {"min_num_params": 0, "xla": false, "xla_fsdp_grad_ckpt": false}, "fsdp_transformer_layer_cls_to_wrap": null, "deepspeed": null, "label_smoothing_factor": 0.0, "optim": "adamw_torch", "optim_args": null, "adafactor": false, "group_by_length": false, "length_column_name": "length", "report_to": ["tensorboard"], "ddp_find_unused_parameters": null, "ddp_bucket_cap_mb": null, "ddp_broadcast_buffers": null, "dataloader_pin_memory": true, "dataloader_persistent_workers": false, "skip_memory_metrics": true, "use_legacy_prediction_loop": false, "push_to_hub": false, "resume_from_checkpoint": null, "hub_model_id": null, "hub_strategy": "every_save", "hub_token": "<HUB_TOKEN>", "hub_private_repo": false, "hub_always_push": false, "gradient_checkpointing": false, "gradient_checkpointing_kwargs": null, "include_inputs_for_metrics": false, "fp16_backend": "auto", "push_to_hub_model_id": null, "push_to_hub_organization": null, "push_to_hub_token": "<PUSH_TO_HUB_TOKEN>", "mp_parameters": "", "auto_find_batch_size": false, "full_determinism": false, "torchdynamo": null, "ray_scope": "last", "ddp_timeout": 1800, "torch_compile": false, "torch_compile_backend": null, "torch_compile_mode": null, "dispatch_batches": null, "split_batches": false, "include_tokens_per_second": false, "include_num_input_tokens_seen": false, "neftune_noise_alpha": null}
 
 
wav2vec2/freeze/02_wav2vec2-large-960-h/trainer_state.json DELETED
@@ -1,618 +0,0 @@
1
- {
2
- "best_metric": null,
3
- "best_model_checkpoint": null,
4
- "epoch": 30.0,
5
- "eval_steps": 500,
6
- "global_step": 9390,
7
- "is_hyper_param_search": false,
8
- "is_local_process_zero": true,
9
- "is_world_process_zero": true,
10
- "log_history": [
11
- {
12
- "epoch": 1.0,
13
- "eval_loss": 4.46884298324585,
14
- "eval_mse_0": 4.556619167327881,
15
- "eval_mse_1": 4.266129493713379,
16
- "eval_mse_2": 4.532381057739258,
17
- "eval_mse_3": 4.520243167877197,
18
- "eval_pcc_0": -0.1200762895413838,
19
- "eval_pcc_1": -0.008083556391114409,
20
- "eval_pcc_2": -0.00288564105688843,
21
- "eval_pcc_3": -0.07375013745739004,
22
- "eval_runtime": 102.731,
23
- "eval_samples_per_second": 24.335,
24
- "eval_steps_per_second": 3.047,
25
- "step": 313
26
- },
27
- {
28
- "epoch": 1.6,
29
- "learning_rate": 9.467518636847711e-06,
30
- "loss": 11.3525,
31
- "step": 500
32
- },
33
- {
34
- "epoch": 2.0,
35
- "eval_loss": 2.2717549800872803,
36
- "eval_mse_0": 2.484067678451538,
37
- "eval_mse_1": 2.05204439163208,
38
- "eval_mse_2": 2.0998952388763428,
39
- "eval_mse_3": 2.45101261138916,
40
- "eval_pcc_0": -0.11671111695287814,
41
- "eval_pcc_1": -0.2033763027995093,
42
- "eval_pcc_2": 0.30446639735308567,
43
- "eval_pcc_3": -0.22165009839512184,
44
- "eval_runtime": 101.4114,
45
- "eval_samples_per_second": 24.652,
46
- "eval_steps_per_second": 3.086,
47
- "step": 626
48
- },
49
- {
50
- "epoch": 3.0,
51
- "eval_loss": 2.2065045833587646,
52
- "eval_mse_0": 2.447479009628296,
53
- "eval_mse_1": 1.972946286201477,
54
- "eval_mse_2": 2.003359317779541,
55
- "eval_mse_3": 2.4022369384765625,
56
- "eval_pcc_0": 0.18293676920695143,
57
- "eval_pcc_1": 0.21790504805056626,
58
- "eval_pcc_2": 0.18452597141460383,
59
- "eval_pcc_3": 0.20256941748505725,
60
- "eval_runtime": 101.461,
61
- "eval_samples_per_second": 24.64,
62
- "eval_steps_per_second": 3.085,
63
- "step": 939
64
- },
65
- {
66
- "epoch": 3.19,
67
- "learning_rate": 8.935037273695422e-06,
68
- "loss": 2.7334,
69
- "step": 1000
70
- },
71
- {
72
- "epoch": 4.0,
73
- "eval_loss": 1.9920305013656616,
74
- "eval_mse_0": 2.111795425415039,
75
- "eval_mse_1": 1.8264304399490356,
76
- "eval_mse_2": 1.8920977115631104,
77
- "eval_mse_3": 2.137789249420166,
78
- "eval_pcc_0": 0.34792562797032606,
79
- "eval_pcc_1": 0.38141477981177124,
80
- "eval_pcc_2": 0.38079053034971305,
81
- "eval_pcc_3": 0.3478694471584418,
82
- "eval_runtime": 101.1374,
83
- "eval_samples_per_second": 24.719,
84
- "eval_steps_per_second": 3.095,
85
- "step": 1252
86
- },
87
- {
88
- "epoch": 4.79,
89
- "learning_rate": 8.402555910543132e-06,
90
- "loss": 1.8436,
91
- "step": 1500
92
- },
93
- {
94
- "epoch": 5.0,
95
- "eval_loss": 1.509245753288269,
96
- "eval_mse_0": 1.6858148574829102,
97
- "eval_mse_1": 1.3374269008636475,
98
- "eval_mse_2": 1.3511474132537842,
99
- "eval_mse_3": 1.6625945568084717,
100
- "eval_pcc_0": 0.5746034644728661,
101
- "eval_pcc_1": 0.6057685456658796,
102
- "eval_pcc_2": 0.5941913933632681,
103
- "eval_pcc_3": 0.5815709152115393,
104
- "eval_runtime": 101.1548,
105
- "eval_samples_per_second": 24.715,
106
- "eval_steps_per_second": 3.094,
107
- "step": 1565
108
- },
109
- {
110
- "epoch": 6.0,
111
- "eval_loss": 1.220288872718811,
112
- "eval_mse_0": 1.3848838806152344,
113
- "eval_mse_1": 1.0677039623260498,
114
- "eval_mse_2": 1.058583378791809,
115
- "eval_mse_3": 1.3699851036071777,
116
- "eval_pcc_0": 0.6463640436429148,
117
- "eval_pcc_1": 0.7036960582986487,
118
- "eval_pcc_2": 0.70144206574631,
119
- "eval_pcc_3": 0.6562105416443055,
120
- "eval_runtime": 100.779,
121
- "eval_samples_per_second": 24.807,
122
- "eval_steps_per_second": 3.106,
123
- "step": 1878
124
- },
125
- {
126
- "epoch": 6.39,
127
- "learning_rate": 7.870074547390843e-06,
128
- "loss": 1.1453,
129
- "step": 2000
130
- },
131
- {
132
- "epoch": 7.0,
133
- "eval_loss": 1.2367130517959595,
134
- "eval_mse_0": 1.3900976181030273,
135
- "eval_mse_1": 1.1321898698806763,
136
- "eval_mse_2": 1.041582465171814,
137
- "eval_mse_3": 1.3829838037490845,
138
- "eval_pcc_0": 0.6720573727923348,
139
- "eval_pcc_1": 0.7216660705035336,
140
- "eval_pcc_2": 0.7232393771546507,
141
- "eval_pcc_3": 0.6877196314655709,
142
- "eval_runtime": 100.8331,
143
- "eval_samples_per_second": 24.793,
144
- "eval_steps_per_second": 3.104,
145
- "step": 2191
146
- },
147
- {
148
- "epoch": 7.99,
149
- "learning_rate": 7.337593184238552e-06,
150
- "loss": 0.8447,
151
- "step": 2500
152
- },
153
- {
154
- "epoch": 8.0,
155
- "eval_loss": 1.2162216901779175,
156
- "eval_mse_0": 1.460018277168274,
157
- "eval_mse_1": 1.0076597929000854,
158
- "eval_mse_2": 0.9815776348114014,
159
- "eval_mse_3": 1.4156315326690674,
160
- "eval_pcc_0": 0.6963019356889134,
161
- "eval_pcc_1": 0.7430064815097713,
162
- "eval_pcc_2": 0.7496560623081919,
163
- "eval_pcc_3": 0.7131421998955473,
164
- "eval_runtime": 100.7736,
165
- "eval_samples_per_second": 24.808,
166
- "eval_steps_per_second": 3.106,
167
- "step": 2504
168
- },
169
- {
170
- "epoch": 9.0,
171
- "eval_loss": 1.017881155014038,
172
- "eval_mse_0": 1.2040300369262695,
173
- "eval_mse_1": 0.8602417707443237,
174
- "eval_mse_2": 0.8572937250137329,
175
- "eval_mse_3": 1.149958848953247,
176
- "eval_pcc_0": 0.7161187909551995,
177
- "eval_pcc_1": 0.7715997989818665,
178
- "eval_pcc_2": 0.7754971497384231,
179
- "eval_pcc_3": 0.7352543400059409,
180
- "eval_runtime": 100.6372,
181
- "eval_samples_per_second": 24.842,
182
- "eval_steps_per_second": 3.11,
183
- "step": 2817
184
- },
185
- {
186
- "epoch": 9.58,
187
- "learning_rate": 6.805111821086262e-06,
188
- "loss": 0.685,
189
- "step": 3000
190
- },
191
- {
192
- "epoch": 10.0,
193
- "eval_loss": 1.2485902309417725,
194
- "eval_mse_0": 1.5102765560150146,
195
- "eval_mse_1": 1.0398504734039307,
196
- "eval_mse_2": 1.0204538106918335,
197
- "eval_mse_3": 1.4237797260284424,
198
- "eval_pcc_0": 0.7002148987459401,
199
- "eval_pcc_1": 0.7517921458553957,
200
- "eval_pcc_2": 0.7560200956358883,
201
- "eval_pcc_3": 0.7198293809052392,
202
- "eval_runtime": 100.8751,
203
- "eval_samples_per_second": 24.783,
204
- "eval_steps_per_second": 3.103,
205
- "step": 3130
206
- },
207
- {
208
- "epoch": 11.0,
209
- "eval_loss": 1.2647656202316284,
210
- "eval_mse_0": 1.4378533363342285,
211
- "eval_mse_1": 1.09242582321167,
212
- "eval_mse_2": 1.1140285730361938,
213
- "eval_mse_3": 1.4147529602050781,
214
- "eval_pcc_0": 0.7008215452758584,
215
- "eval_pcc_1": 0.7639064782042907,
216
- "eval_pcc_2": 0.7663777952981761,
217
- "eval_pcc_3": 0.7192141244692235,
218
- "eval_runtime": 100.5861,
219
- "eval_samples_per_second": 24.854,
220
- "eval_steps_per_second": 3.112,
221
- "step": 3443
222
- },
223
- {
224
- "epoch": 11.18,
225
- "learning_rate": 6.272630457933972e-06,
226
- "loss": 0.6023,
227
- "step": 3500
228
- },
229
- {
230
- "epoch": 12.0,
231
- "eval_loss": 1.5249193906784058,
232
- "eval_mse_0": 1.7945510149002075,
233
- "eval_mse_1": 1.3268375396728516,
234
- "eval_mse_2": 1.3702497482299805,
235
- "eval_mse_3": 1.608039379119873,
236
- "eval_pcc_0": 0.6972207487496517,
237
- "eval_pcc_1": 0.7669014561853221,
238
- "eval_pcc_2": 0.7691075067466909,
239
- "eval_pcc_3": 0.721238988188765,
240
- "eval_runtime": 100.8103,
241
- "eval_samples_per_second": 24.799,
242
- "eval_steps_per_second": 3.105,
243
- "step": 3756
244
- },
245
- {
246
- "epoch": 12.78,
247
- "learning_rate": 5.7401490947816826e-06,
248
- "loss": 0.4995,
249
- "step": 4000
250
- },
251
- {
252
- "epoch": 13.0,
253
- "eval_loss": 1.253173589706421,
254
- "eval_mse_0": 1.4855499267578125,
255
- "eval_mse_1": 1.0352025032043457,
256
- "eval_mse_2": 1.129489779472351,
257
- "eval_mse_3": 1.3624502420425415,
258
- "eval_pcc_0": 0.7117532688299948,
259
- "eval_pcc_1": 0.774173946684155,
260
- "eval_pcc_2": 0.7782329488765708,
261
- "eval_pcc_3": 0.7309196281189452,
262
- "eval_runtime": 100.8137,
263
- "eval_samples_per_second": 24.798,
264
- "eval_steps_per_second": 3.105,
265
- "step": 4069
266
- },
267
- {
268
- "epoch": 14.0,
269
- "eval_loss": 1.3741823434829712,
270
- "eval_mse_0": 1.5647484064102173,
271
- "eval_mse_1": 1.2162861824035645,
272
- "eval_mse_2": 1.2469784021377563,
273
- "eval_mse_3": 1.4687162637710571,
274
- "eval_pcc_0": 0.6989563197866396,
275
- "eval_pcc_1": 0.7747585936521968,
276
- "eval_pcc_2": 0.7769862273308229,
277
- "eval_pcc_3": 0.7220260621330542,
278
- "eval_runtime": 100.8527,
279
- "eval_samples_per_second": 24.789,
280
- "eval_steps_per_second": 3.104,
281
- "step": 4382
282
- },
283
- {
284
- "epoch": 14.38,
285
- "learning_rate": 5.207667731629393e-06,
286
- "loss": 0.4523,
287
- "step": 4500
288
- },
289
- {
290
- "epoch": 15.0,
291
- "eval_loss": 1.0725396871566772,
292
- "eval_mse_0": 1.2864934206008911,
293
- "eval_mse_1": 0.8737435340881348,
294
- "eval_mse_2": 0.9018136858940125,
295
- "eval_mse_3": 1.2281088829040527,
296
- "eval_pcc_0": 0.7209750758108714,
297
- "eval_pcc_1": 0.7731212421404814,
298
- "eval_pcc_2": 0.7782837759414466,
299
- "eval_pcc_3": 0.7418978897928706,
300
- "eval_runtime": 100.6545,
301
- "eval_samples_per_second": 24.837,
302
- "eval_steps_per_second": 3.11,
303
- "step": 4695
304
- },
305
- {
306
- "epoch": 15.97,
307
- "learning_rate": 4.675186368477103e-06,
308
- "loss": 0.4156,
309
- "step": 5000
310
- },
311
- {
312
- "epoch": 16.0,
313
- "eval_loss": 1.2100777626037598,
314
- "eval_mse_0": 1.4708300828933716,
315
- "eval_mse_1": 1.045762062072754,
316
- "eval_mse_2": 0.9293324947357178,
317
- "eval_mse_3": 1.3943835496902466,
318
- "eval_pcc_0": 0.710512400200325,
319
- "eval_pcc_1": 0.775940078033711,
320
- "eval_pcc_2": 0.7809762683265106,
321
- "eval_pcc_3": 0.7313685530753434,
322
- "eval_runtime": 100.4992,
323
- "eval_samples_per_second": 24.876,
324
- "eval_steps_per_second": 3.114,
325
- "step": 5008
326
- },
327
- {
328
- "epoch": 17.0,
329
- "eval_loss": 1.2254164218902588,
330
- "eval_mse_0": 1.5274760723114014,
331
- "eval_mse_1": 0.9632775187492371,
332
- "eval_mse_2": 0.9601842761039734,
333
- "eval_mse_3": 1.4507263898849487,
334
- "eval_pcc_0": 0.7090201034954653,
335
- "eval_pcc_1": 0.77499609102717,
336
- "eval_pcc_2": 0.7802451404026648,
337
- "eval_pcc_3": 0.7328554072609484,
338
- "eval_runtime": 100.6175,
339
- "eval_samples_per_second": 24.847,
340
- "eval_steps_per_second": 3.111,
341
- "step": 5321
342
- },
343
- {
344
- "epoch": 17.57,
345
- "learning_rate": 4.142705005324814e-06,
346
- "loss": 0.3597,
347
- "step": 5500
348
- },
349
- {
350
- "epoch": 18.0,
351
- "eval_loss": 1.1543495655059814,
352
- "eval_mse_0": 1.3588272333145142,
353
- "eval_mse_1": 0.9966268539428711,
354
- "eval_mse_2": 1.0238536596298218,
355
- "eval_mse_3": 1.2380930185317993,
356
- "eval_pcc_0": 0.7067521978223112,
357
- "eval_pcc_1": 0.7783125065749951,
358
- "eval_pcc_2": 0.7820830799344918,
359
- "eval_pcc_3": 0.7308957159598582,
360
- "eval_runtime": 100.9636,
361
- "eval_samples_per_second": 24.761,
362
- "eval_steps_per_second": 3.1,
363
- "step": 5634
364
- },
365
- {
366
- "epoch": 19.0,
367
- "eval_loss": 1.2339210510253906,
368
- "eval_mse_0": 1.549616813659668,
369
- "eval_mse_1": 0.9578074216842651,
370
- "eval_mse_2": 0.9888249039649963,
371
- "eval_mse_3": 1.439432978630066,
372
- "eval_pcc_0": 0.7016920379377147,
373
- "eval_pcc_1": 0.7749969143189515,
374
- "eval_pcc_2": 0.7777615745421065,
375
- "eval_pcc_3": 0.7271276424575814,
376
- "eval_runtime": 101.2163,
377
- "eval_samples_per_second": 24.7,
378
- "eval_steps_per_second": 3.092,
379
- "step": 5947
380
- },
381
- {
382
- "epoch": 19.17,
383
- "learning_rate": 3.6102236421725247e-06,
384
- "loss": 0.3666,
385
- "step": 6000
386
- },
387
- {
388
- "epoch": 20.0,
389
- "eval_loss": 1.284563422203064,
390
- "eval_mse_0": 1.512956976890564,
391
- "eval_mse_1": 1.0522581338882446,
392
- "eval_mse_2": 1.0659490823745728,
393
- "eval_mse_3": 1.5070868730545044,
394
- "eval_pcc_0": 0.700473376116245,
395
- "eval_pcc_1": 0.7696975480736717,
396
- "eval_pcc_2": 0.7731986131858355,
397
- "eval_pcc_3": 0.7213954481369491,
398
- "eval_runtime": 101.1085,
399
- "eval_samples_per_second": 24.726,
400
- "eval_steps_per_second": 3.096,
401
- "step": 6260
402
- },
403
- {
404
- "epoch": 20.77,
405
- "learning_rate": 3.0777422790202343e-06,
406
- "loss": 0.3392,
407
- "step": 6500
408
- },
409
- {
410
- "epoch": 21.0,
411
- "eval_loss": 1.4056222438812256,
412
- "eval_mse_0": 1.6199438571929932,
413
- "eval_mse_1": 1.2088689804077148,
414
- "eval_mse_2": 1.2439439296722412,
415
- "eval_mse_3": 1.5497353076934814,
416
- "eval_pcc_0": 0.6995909787379511,
417
- "eval_pcc_1": 0.7720848682005105,
418
- "eval_pcc_2": 0.7764712535309326,
419
- "eval_pcc_3": 0.7248104304088917,
420
- "eval_runtime": 101.0134,
421
- "eval_samples_per_second": 24.749,
422
- "eval_steps_per_second": 3.099,
423
- "step": 6573
424
- },
425
- {
426
- "epoch": 22.0,
427
- "eval_loss": 1.449997901916504,
428
- "eval_mse_0": 1.736374855041504,
429
- "eval_mse_1": 1.1733485460281372,
430
- "eval_mse_2": 1.2176486253738403,
431
- "eval_mse_3": 1.6726168394088745,
432
- "eval_pcc_0": 0.6930084858186102,
433
- "eval_pcc_1": 0.7724013026135311,
434
- "eval_pcc_2": 0.7754724166633662,
435
- "eval_pcc_3": 0.7196819586724444,
436
- "eval_runtime": 101.1915,
437
- "eval_samples_per_second": 24.706,
438
- "eval_steps_per_second": 3.093,
439
- "step": 6886
440
- },
441
- {
442
- "epoch": 22.36,
443
- "learning_rate": 2.5452609158679447e-06,
444
- "loss": 0.3344,
445
- "step": 7000
446
- },
447
- {
448
- "epoch": 23.0,
449
- "eval_loss": 1.352881669998169,
450
- "eval_mse_0": 1.5814332962036133,
451
- "eval_mse_1": 1.184563159942627,
452
- "eval_mse_2": 1.1705291271209717,
453
- "eval_mse_3": 1.4750003814697266,
454
- "eval_pcc_0": 0.694369288494083,
455
- "eval_pcc_1": 0.772146498540526,
456
- "eval_pcc_2": 0.7749382640309107,
457
- "eval_pcc_3": 0.721789102660383,
458
- "eval_runtime": 101.1659,
459
- "eval_samples_per_second": 24.712,
460
- "eval_steps_per_second": 3.094,
461
- "step": 7199
462
- },
463
- {
464
- "epoch": 23.96,
465
- "learning_rate": 2.012779552715655e-06,
466
- "loss": 0.2822,
467
- "step": 7500
468
- },
469
- {
470
- "epoch": 24.0,
471
- "eval_loss": 1.3014124631881714,
472
- "eval_mse_0": 1.5749812126159668,
473
- "eval_mse_1": 1.079409122467041,
474
- "eval_mse_2": 1.0792959928512573,
475
- "eval_mse_3": 1.4719666242599487,
476
- "eval_pcc_0": 0.693710854304797,
477
- "eval_pcc_1": 0.7718121846026597,
478
- "eval_pcc_2": 0.7743325438090641,
479
- "eval_pcc_3": 0.7213917030246094,
480
- "eval_runtime": 101.1516,
481
- "eval_samples_per_second": 24.715,
482
- "eval_steps_per_second": 3.094,
483
- "step": 7512
484
- },
485
- {
486
- "epoch": 25.0,
487
- "eval_loss": 1.3579597473144531,
488
- "eval_mse_0": 1.6819802522659302,
489
- "eval_mse_1": 1.0997533798217773,
490
- "eval_mse_2": 1.0862921476364136,
491
- "eval_mse_3": 1.5638113021850586,
492
- "eval_pcc_0": 0.70045389986088,
493
- "eval_pcc_1": 0.7719589220752782,
494
- "eval_pcc_2": 0.7752175306643139,
495
- "eval_pcc_3": 0.7251075024902888,
496
- "eval_runtime": 100.9651,
497
- "eval_samples_per_second": 24.761,
498
- "eval_steps_per_second": 3.1,
499
- "step": 7825
500
- },
501
- {
502
- "epoch": 25.56,
503
- "learning_rate": 1.4802981895633654e-06,
504
- "loss": 0.2661,
505
- "step": 8000
506
- },
507
- {
508
- "epoch": 26.0,
509
- "eval_loss": 1.2779024839401245,
510
- "eval_mse_0": 1.5422532558441162,
511
- "eval_mse_1": 1.067108392715454,
512
- "eval_mse_2": 1.07560396194458,
513
- "eval_mse_3": 1.4266425371170044,
514
- "eval_pcc_0": 0.7005120895064469,
515
- "eval_pcc_1": 0.7694452309708577,
516
- "eval_pcc_2": 0.770560788580687,
517
- "eval_pcc_3": 0.7239205802511122,
518
- "eval_runtime": 101.233,
519
- "eval_samples_per_second": 24.695,
520
- "eval_steps_per_second": 3.092,
521
- "step": 8138
522
- },
523
- {
524
- "epoch": 27.0,
525
- "eval_loss": 1.3012428283691406,
526
- "eval_mse_0": 1.564691424369812,
527
- "eval_mse_1": 1.0934994220733643,
528
- "eval_mse_2": 1.0779967308044434,
529
- "eval_mse_3": 1.468787670135498,
530
- "eval_pcc_0": 0.6987064020880897,
531
- "eval_pcc_1": 0.7744903175065133,
532
- "eval_pcc_2": 0.775799665255104,
533
- "eval_pcc_3": 0.7248106165784408,
534
- "eval_runtime": 101.1773,
535
- "eval_samples_per_second": 24.709,
536
- "eval_steps_per_second": 3.094,
537
- "step": 8451
538
- },
539
- {
540
- "epoch": 27.16,
541
- "learning_rate": 9.478168264110757e-07,
542
- "loss": 0.2508,
543
- "step": 8500
544
- },
545
- {
546
- "epoch": 28.0,
547
- "eval_loss": 1.2420473098754883,
548
- "eval_mse_0": 1.486934781074524,
549
- "eval_mse_1": 1.0512487888336182,
550
- "eval_mse_2": 1.0487338304519653,
551
- "eval_mse_3": 1.3812716007232666,
552
- "eval_pcc_0": 0.7011823686358516,
553
- "eval_pcc_1": 0.776348263484386,
554
- "eval_pcc_2": 0.777335498311736,
555
- "eval_pcc_3": 0.7281257734194877,
556
- "eval_runtime": 101.1356,
557
- "eval_samples_per_second": 24.719,
558
- "eval_steps_per_second": 3.095,
559
- "step": 8764
560
- },
561
- {
562
- "epoch": 28.75,
563
- "learning_rate": 4.1533546325878595e-07,
564
- "loss": 0.2409,
565
- "step": 9000
566
- },
567
- {
568
- "epoch": 29.0,
569
- "eval_loss": 1.227847695350647,
570
- "eval_mse_0": 1.4629440307617188,
571
- "eval_mse_1": 1.0204648971557617,
572
- "eval_mse_2": 1.0520468950271606,
573
- "eval_mse_3": 1.375935673713684,
574
- "eval_pcc_0": 0.7006825061450325,
575
- "eval_pcc_1": 0.7737583965098994,
576
- "eval_pcc_2": 0.7744480181106479,
577
- "eval_pcc_3": 0.727203867844303,
578
- "eval_runtime": 100.7797,
579
- "eval_samples_per_second": 24.807,
580
- "eval_steps_per_second": 3.106,
581
- "step": 9077
582
- },
583
- {
584
- "epoch": 30.0,
585
- "eval_loss": 1.2460167407989502,
586
- "eval_mse_0": 1.4599828720092773,
587
- "eval_mse_1": 1.062279224395752,
588
- "eval_mse_2": 1.073793888092041,
589
- "eval_mse_3": 1.3880120515823364,
590
- "eval_pcc_0": 0.7018509725629924,
591
- "eval_pcc_1": 0.7738516252096618,
592
- "eval_pcc_2": 0.774751106649783,
593
- "eval_pcc_3": 0.7272315825392802,
594
- "eval_runtime": 100.9156,
595
- "eval_samples_per_second": 24.773,
596
- "eval_steps_per_second": 3.102,
597
- "step": 9390
598
- },
599
- {
600
- "epoch": 30.0,
601
- "step": 9390,
602
- "total_flos": 0.0,
603
- "train_loss": 1.2372805285631532,
604
- "train_runtime": 9022.2383,
605
- "train_samples_per_second": 8.313,
606
- "train_steps_per_second": 1.041
607
- }
608
- ],
609
- "logging_steps": 500,
610
- "max_steps": 9390,
611
- "num_input_tokens_seen": 0,
612
- "num_train_epochs": 30,
613
- "save_steps": 500,
614
- "total_flos": 0.0,
615
- "train_batch_size": 8,
616
- "trial_name": null,
617
- "trial_params": null
618
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
wav2vec2/freeze/02_wav2vec2-large-960-h/training_args.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:a45aec78554f06f17036b9cafa66fcbd402471edb2d8c23ec1a002e05aa20d99
3
- size 4792