yeshpanovrustem committed on
Commit
9163f01
·
1 Parent(s): 2b92869

Delete trainer_state.json

Browse files
Files changed (1) hide show
  1. trainer_state.json +0 -160
trainer_state.json DELETED
@@ -1,160 +0,0 @@
1
- {
2
- "best_metric": null,
3
- "best_model_checkpoint": null,
4
- "epoch": 10.0,
5
- "global_step": 2330,
6
- "is_hyper_param_search": false,
7
- "is_local_process_zero": true,
8
- "is_world_process_zero": true,
9
- "log_history": [
10
- {
11
- "epoch": 1.0,
12
- "eval_accuracy": 0.8702409035670884,
13
- "eval_f1": 0.2995999407319603,
14
- "eval_loss": 0.5389052033424377,
15
- "eval_precision": 0.33331959612610756,
16
- "eval_recall": 0.27207589060450094,
17
- "eval_runtime": 14.1196,
18
- "eval_samples_per_second": 1054.99,
19
- "eval_steps_per_second": 2.125,
20
- "step": 233
21
- },
22
- {
23
- "epoch": 2.0,
24
- "eval_accuracy": 0.9681749946386446,
25
- "eval_f1": 0.8514915583419936,
26
- "eval_loss": 0.12146873772144318,
27
- "eval_precision": 0.8626164998274076,
28
- "eval_recall": 0.8406499142193965,
29
- "eval_runtime": 15.0925,
30
- "eval_samples_per_second": 986.983,
31
- "eval_steps_per_second": 1.988,
32
- "step": 466
33
- },
34
- {
35
- "epoch": 2.15,
36
- "learning_rate": 6.25e-06,
37
- "loss": 1.2635,
38
- "step": 500
39
- },
40
- {
41
- "epoch": 3.0,
42
- "eval_accuracy": 0.9790478232897276,
43
- "eval_f1": 0.9141998345125719,
44
- "eval_loss": 0.0771816298365593,
45
- "eval_precision": 0.9178421266784212,
46
- "eval_recall": 0.9105863356544556,
47
- "eval_runtime": 14.0091,
48
- "eval_samples_per_second": 1063.307,
49
- "eval_steps_per_second": 2.141,
50
- "step": 699
51
- },
52
- {
53
- "epoch": 4.0,
54
- "eval_accuracy": 0.98271141611266,
55
- "eval_f1": 0.9309382867251821,
56
- "eval_loss": 0.06554248929023743,
57
- "eval_precision": 0.9416055882454148,
58
- "eval_recall": 0.9205099740976217,
59
- "eval_runtime": 14.0197,
60
- "eval_samples_per_second": 1062.501,
61
- "eval_steps_per_second": 2.14,
62
- "step": 932
63
- },
64
- {
65
- "epoch": 4.29,
66
- "learning_rate": 8.69281045751634e-06,
67
- "loss": 0.0906,
68
- "step": 1000
69
- },
70
- {
71
- "epoch": 5.0,
72
- "eval_accuracy": 0.984880977911216,
73
- "eval_f1": 0.9419223941161552,
74
- "eval_loss": 0.06115253269672394,
75
- "eval_precision": 0.9468692637160921,
76
- "eval_recall": 0.9370269452013321,
77
- "eval_runtime": 14.0288,
78
- "eval_samples_per_second": 1061.817,
79
- "eval_steps_per_second": 2.138,
80
- "step": 1165
81
- },
82
- {
83
- "epoch": 6.0,
84
- "eval_accuracy": 0.9843269711916506,
85
- "eval_f1": 0.9446501919062689,
86
- "eval_loss": 0.062205445021390915,
87
- "eval_precision": 0.9454459682582471,
88
- "eval_recall": 0.9438557540283244,
89
- "eval_runtime": 14.4851,
90
- "eval_samples_per_second": 1028.367,
91
- "eval_steps_per_second": 2.071,
92
- "step": 1398
93
- },
94
- {
95
- "epoch": 6.44,
96
- "learning_rate": 5.4248366013071894e-06,
97
- "loss": 0.0429,
98
- "step": 1500
99
- },
100
- {
101
- "epoch": 7.0,
102
- "eval_accuracy": 0.9854850239473872,
103
- "eval_f1": 0.9466268938436389,
104
- "eval_loss": 0.06088804826140404,
105
- "eval_precision": 0.9484971293481932,
106
- "eval_recall": 0.9447640192417668,
107
- "eval_runtime": 14.327,
108
- "eval_samples_per_second": 1039.716,
109
- "eval_steps_per_second": 2.094,
110
- "step": 1631
111
- },
112
- {
113
- "epoch": 8.0,
114
- "eval_accuracy": 0.9853885195510759,
115
- "eval_f1": 0.9475256832068758,
116
- "eval_loss": 0.06388872861862183,
117
- "eval_precision": 0.9456525381135868,
118
- "eval_recall": 0.9494062636660275,
119
- "eval_runtime": 14.5864,
120
- "eval_samples_per_second": 1021.225,
121
- "eval_steps_per_second": 2.057,
122
- "step": 1864
123
- },
124
- {
125
- "epoch": 8.58,
126
- "learning_rate": 2.1568627450980393e-06,
127
- "loss": 0.0265,
128
- "step": 2000
129
- },
130
- {
131
- "epoch": 9.0,
132
- "eval_accuracy": 0.9858710415326328,
133
- "eval_f1": 0.9485348353785288,
134
- "eval_loss": 0.06375858187675476,
135
- "eval_precision": 0.9453968253968253,
136
- "eval_recall": 0.9516937464258082,
137
- "eval_runtime": 14.1094,
138
- "eval_samples_per_second": 1055.751,
139
- "eval_steps_per_second": 2.126,
140
- "step": 2097
141
- },
142
- {
143
- "epoch": 10.0,
144
- "eval_accuracy": 0.9859925655872471,
145
- "eval_f1": 0.949012494961709,
146
- "eval_loss": 0.06480085104703903,
147
- "eval_precision": 0.9475802394607103,
148
- "eval_recall": 0.9504490866888687,
149
- "eval_runtime": 13.7245,
150
- "eval_samples_per_second": 1085.359,
151
- "eval_steps_per_second": 2.186,
152
- "step": 2330
153
- }
154
- ],
155
- "max_steps": 2330,
156
- "num_train_epochs": 10,
157
- "total_flos": 1.6349634872247114e+17,
158
- "trial_name": null,
159
- "trial_params": null
160
- }