kurosekurose committed on
Commit
896cb83
1 Parent(s): a1dc832

End of training

Browse files
Files changed (3) hide show
  1. pytorch_model.bin +1 -1
  2. trainer_state.json +179 -254
  3. training_args.bin +1 -1
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1e8848c4dbe8d243b8bcf33ca12e6a97243231e706d3728ac5cd04aefa7ba673
3
  size 379933779
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:348ab06f94fbbb9a4199388bb3e4280f3c923b86ec82c2428d19d8ce781444bd
3
  size 379933779
trainer_state.json CHANGED
@@ -1,325 +1,250 @@
1
  {
2
- "best_metric": 0.9141282439231873,
3
- "best_model_checkpoint": "kurosekurose/wav2vec2-base-EMOPIA/checkpoint-410",
4
- "epoch": 19.984,
5
- "global_step": 820,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
- "epoch": 0.98,
12
- "learning_rate": 1.3666666666666668e-06,
13
- "loss": 1.4068,
14
- "step": 41
15
  },
16
  {
17
- "epoch": 0.98,
18
- "eval_accuracy": 0.30000001192092896,
19
- "eval_loss": 1.370680570602417,
20
- "eval_runtime": 40.3938,
21
- "eval_samples_per_second": 1.238,
22
- "eval_steps_per_second": 0.322,
23
- "step": 41
24
  },
25
  {
26
- "epoch": 1.98,
27
- "learning_rate": 2.7333333333333336e-06,
28
- "loss": 1.3568,
29
- "step": 82
30
  },
31
  {
32
- "epoch": 1.98,
33
- "eval_accuracy": 0.3199999928474426,
34
- "eval_loss": 1.3092886209487915,
35
- "eval_runtime": 40.4466,
36
- "eval_samples_per_second": 1.236,
37
- "eval_steps_per_second": 0.321,
38
- "step": 82
39
  },
40
  {
41
- "epoch": 2.98,
42
- "learning_rate": 4.1e-06,
43
- "loss": 1.2503,
44
- "step": 123
45
  },
46
  {
47
- "epoch": 2.98,
48
- "eval_accuracy": 0.46000000834465027,
49
- "eval_loss": 1.178250789642334,
50
- "eval_runtime": 40.4213,
51
- "eval_samples_per_second": 1.237,
52
- "eval_steps_per_second": 0.322,
53
- "step": 123
54
  },
55
  {
56
- "epoch": 3.98,
57
- "learning_rate": 5.466666666666667e-06,
58
- "loss": 1.1088,
59
- "step": 164
60
  },
61
  {
62
- "epoch": 3.98,
63
- "eval_accuracy": 0.41999998688697815,
64
- "eval_loss": 1.16064453125,
65
- "eval_runtime": 40.5701,
66
- "eval_samples_per_second": 1.232,
67
- "eval_steps_per_second": 0.32,
68
- "step": 164
69
  },
70
  {
71
- "epoch": 4.98,
72
- "learning_rate": 6.833333333333334e-06,
73
- "loss": 0.9996,
74
- "step": 205
75
  },
76
  {
77
- "epoch": 4.98,
78
- "eval_accuracy": 0.5400000214576721,
79
- "eval_loss": 1.027118444442749,
80
- "eval_runtime": 40.2938,
81
- "eval_samples_per_second": 1.241,
82
- "eval_steps_per_second": 0.323,
83
- "step": 205
84
  },
85
  {
86
- "epoch": 5.98,
87
- "learning_rate": 8.2e-06,
88
- "loss": 0.924,
89
- "step": 246
90
  },
91
  {
92
- "epoch": 5.98,
93
- "eval_accuracy": 0.5799999833106995,
94
- "eval_loss": 1.009319543838501,
95
- "eval_runtime": 40.7551,
96
- "eval_samples_per_second": 1.227,
97
- "eval_steps_per_second": 0.319,
98
- "step": 246
99
  },
100
  {
101
- "epoch": 6.98,
102
- "learning_rate": 9.566666666666668e-06,
103
- "loss": 0.8449,
104
- "step": 287
105
  },
106
  {
107
- "epoch": 6.98,
108
- "eval_accuracy": 0.5799999833106995,
109
- "eval_loss": 0.961348295211792,
110
- "eval_runtime": 40.5666,
111
- "eval_samples_per_second": 1.233,
112
- "eval_steps_per_second": 0.32,
113
- "step": 287
114
  },
115
  {
116
- "epoch": 7.98,
117
- "learning_rate": 9.461538461538463e-06,
118
- "loss": 0.7559,
119
- "step": 328
120
  },
121
  {
122
- "epoch": 7.98,
123
- "eval_accuracy": 0.6000000238418579,
124
- "eval_loss": 0.937028169631958,
125
- "eval_runtime": 40.5792,
126
- "eval_samples_per_second": 1.232,
127
- "eval_steps_per_second": 0.32,
128
- "step": 328
129
  },
130
  {
131
- "epoch": 8.98,
132
- "learning_rate": 8.673076923076924e-06,
133
- "loss": 0.7744,
134
- "step": 369
135
  },
136
  {
137
- "epoch": 8.98,
138
- "eval_accuracy": 0.5600000023841858,
139
- "eval_loss": 1.0094345808029175,
140
- "eval_runtime": 40.4365,
141
- "eval_samples_per_second": 1.237,
142
- "eval_steps_per_second": 0.321,
143
- "step": 369
144
  },
145
  {
146
- "epoch": 9.98,
147
- "learning_rate": 7.884615384615384e-06,
148
- "loss": 0.6745,
149
- "step": 410
150
  },
151
  {
152
- "epoch": 9.98,
153
- "eval_accuracy": 0.6399999856948853,
154
- "eval_loss": 0.9141282439231873,
155
- "eval_runtime": 40.471,
156
- "eval_samples_per_second": 1.235,
157
- "eval_steps_per_second": 0.321,
158
- "step": 410
159
  },
160
  {
161
- "epoch": 10.98,
162
- "learning_rate": 7.096153846153847e-06,
163
- "loss": 0.6245,
164
- "step": 451
165
  },
166
  {
167
- "epoch": 10.98,
168
- "eval_accuracy": 0.5,
169
- "eval_loss": 1.1951998472213745,
170
- "eval_runtime": 40.6687,
171
- "eval_samples_per_second": 1.229,
172
- "eval_steps_per_second": 0.32,
173
- "step": 451
174
  },
175
  {
176
- "epoch": 11.98,
177
- "learning_rate": 6.307692307692308e-06,
178
- "loss": 0.5174,
179
- "step": 492
180
  },
181
  {
182
- "epoch": 11.98,
183
- "eval_accuracy": 0.6600000262260437,
184
- "eval_loss": 0.9249220490455627,
185
- "eval_runtime": 40.488,
186
- "eval_samples_per_second": 1.235,
187
- "eval_steps_per_second": 0.321,
188
- "step": 492
189
  },
190
  {
191
- "epoch": 12.98,
192
- "learning_rate": 5.5192307692307705e-06,
193
- "loss": 0.5091,
194
- "step": 533
195
  },
196
  {
197
- "epoch": 12.98,
198
- "eval_accuracy": 0.7200000286102295,
199
- "eval_loss": 0.9292579293251038,
200
- "eval_runtime": 40.6346,
201
- "eval_samples_per_second": 1.23,
202
- "eval_steps_per_second": 0.32,
203
- "step": 533
204
  },
205
  {
206
- "epoch": 13.98,
207
- "learning_rate": 4.730769230769231e-06,
208
- "loss": 0.391,
209
- "step": 574
210
  },
211
  {
212
- "epoch": 13.98,
213
- "eval_accuracy": 0.6600000262260437,
214
- "eval_loss": 0.9355679750442505,
215
- "eval_runtime": 40.4106,
216
- "eval_samples_per_second": 1.237,
217
- "eval_steps_per_second": 0.322,
218
- "step": 574
219
  },
220
  {
221
- "epoch": 14.98,
222
- "learning_rate": 3.961538461538462e-06,
223
- "loss": 0.3689,
224
- "step": 615
225
  },
226
  {
227
- "epoch": 14.98,
228
- "eval_accuracy": 0.6200000047683716,
229
- "eval_loss": 1.0244715213775635,
230
- "eval_runtime": 40.302,
231
- "eval_samples_per_second": 1.241,
232
- "eval_steps_per_second": 0.323,
233
- "step": 615
234
  },
235
  {
236
- "epoch": 15.98,
237
- "learning_rate": 3.1730769230769233e-06,
238
- "loss": 0.2816,
239
- "step": 656
240
- },
241
- {
242
- "epoch": 15.98,
243
- "eval_accuracy": 0.6600000262260437,
244
- "eval_loss": 1.0420873165130615,
245
- "eval_runtime": 40.6297,
246
- "eval_samples_per_second": 1.231,
247
- "eval_steps_per_second": 0.32,
248
- "step": 656
249
- },
250
- {
251
- "epoch": 16.98,
252
- "learning_rate": 2.384615384615385e-06,
253
- "loss": 0.3003,
254
- "step": 697
255
- },
256
- {
257
- "epoch": 16.98,
258
- "eval_accuracy": 0.6399999856948853,
259
- "eval_loss": 1.042699933052063,
260
- "eval_runtime": 40.2488,
261
- "eval_samples_per_second": 1.242,
262
- "eval_steps_per_second": 0.323,
263
- "step": 697
264
- },
265
- {
266
- "epoch": 17.98,
267
- "learning_rate": 1.596153846153846e-06,
268
- "loss": 0.2495,
269
- "step": 738
270
- },
271
- {
272
- "epoch": 17.98,
273
- "eval_accuracy": 0.6600000262260437,
274
- "eval_loss": 1.095711350440979,
275
- "eval_runtime": 40.5759,
276
- "eval_samples_per_second": 1.232,
277
- "eval_steps_per_second": 0.32,
278
- "step": 738
279
- },
280
- {
281
- "epoch": 18.98,
282
- "learning_rate": 8.076923076923078e-07,
283
- "loss": 0.2269,
284
- "step": 779
285
- },
286
- {
287
- "epoch": 18.98,
288
- "eval_accuracy": 0.6600000262260437,
289
- "eval_loss": 1.05389404296875,
290
- "eval_runtime": 40.5913,
291
- "eval_samples_per_second": 1.232,
292
- "eval_steps_per_second": 0.32,
293
- "step": 779
294
- },
295
- {
296
- "epoch": 19.98,
297
- "learning_rate": 1.9230769230769234e-08,
298
- "loss": 0.2055,
299
- "step": 820
300
- },
301
- {
302
- "epoch": 19.98,
303
- "eval_accuracy": 0.6800000071525574,
304
- "eval_loss": 1.062558650970459,
305
- "eval_runtime": 40.7382,
306
- "eval_samples_per_second": 1.227,
307
- "eval_steps_per_second": 0.319,
308
- "step": 820
309
- },
310
- {
311
- "epoch": 19.98,
312
- "step": 820,
313
- "total_flos": 5.721848459887288e+18,
314
- "train_loss": 0.6885371266341791,
315
- "train_runtime": 22708.6522,
316
- "train_samples_per_second": 0.44,
317
- "train_steps_per_second": 0.036
318
  }
319
  ],
320
- "max_steps": 820,
321
- "num_train_epochs": 20,
322
- "total_flos": 5.721848459887288e+18,
323
  "trial_name": null,
324
  "trial_params": null
325
  }
 
1
  {
2
+ "best_metric": 0.7735137939453125,
3
+ "best_model_checkpoint": "kurosekurose/wav2vec2-base-EMOPIA/checkpoint-348",
4
+ "epoch": 14.994285714285715,
5
+ "global_step": 870,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
+ "epoch": 0.99,
12
+ "learning_rate": 1.9333333333333336e-06,
13
+ "loss": 1.3867,
14
+ "step": 58
15
  },
16
  {
17
+ "epoch": 0.99,
18
+ "eval_accuracy": 0.3285714387893677,
19
+ "eval_loss": 1.3517659902572632,
20
+ "eval_runtime": 46.5999,
21
+ "eval_samples_per_second": 1.502,
22
+ "eval_steps_per_second": 0.386,
23
+ "step": 58
24
  },
25
  {
26
+ "epoch": 1.99,
27
+ "learning_rate": 3.866666666666667e-06,
28
+ "loss": 1.2842,
29
+ "step": 116
30
  },
31
  {
32
+ "epoch": 1.99,
33
+ "eval_accuracy": 0.4571428596973419,
34
+ "eval_loss": 1.18719482421875,
35
+ "eval_runtime": 46.74,
36
+ "eval_samples_per_second": 1.498,
37
+ "eval_steps_per_second": 0.385,
38
+ "step": 116
39
  },
40
  {
41
+ "epoch": 2.99,
42
+ "learning_rate": 5.8e-06,
43
+ "loss": 1.0725,
44
+ "step": 174
45
  },
46
  {
47
+ "epoch": 2.99,
48
+ "eval_accuracy": 0.5571428537368774,
49
+ "eval_loss": 1.0476346015930176,
50
+ "eval_runtime": 46.9576,
51
+ "eval_samples_per_second": 1.491,
52
+ "eval_steps_per_second": 0.383,
53
+ "step": 174
54
  },
55
  {
56
+ "epoch": 3.99,
57
+ "learning_rate": 7.733333333333334e-06,
58
+ "loss": 0.9343,
59
+ "step": 232
60
  },
61
  {
62
+ "epoch": 3.99,
63
+ "eval_accuracy": 0.5714285969734192,
64
+ "eval_loss": 0.9676682949066162,
65
+ "eval_runtime": 46.68,
66
+ "eval_samples_per_second": 1.5,
67
+ "eval_steps_per_second": 0.386,
68
+ "step": 232
69
  },
70
  {
71
+ "epoch": 4.99,
72
+ "learning_rate": 9.666666666666667e-06,
73
+ "loss": 0.8053,
74
+ "step": 290
75
  },
76
  {
77
+ "epoch": 4.99,
78
+ "eval_accuracy": 0.6142857074737549,
79
+ "eval_loss": 0.9524909257888794,
80
+ "eval_runtime": 46.7102,
81
+ "eval_samples_per_second": 1.499,
82
+ "eval_steps_per_second": 0.385,
83
+ "step": 290
84
  },
85
  {
86
+ "epoch": 5.99,
87
+ "learning_rate": 9.157894736842105e-06,
88
+ "loss": 0.7895,
89
+ "step": 348
90
  },
91
  {
92
+ "epoch": 5.99,
93
+ "eval_accuracy": 0.6857143044471741,
94
+ "eval_loss": 0.7735137939453125,
95
+ "eval_runtime": 46.9896,
96
+ "eval_samples_per_second": 1.49,
97
+ "eval_steps_per_second": 0.383,
98
+ "step": 348
99
  },
100
  {
101
+ "epoch": 6.99,
102
+ "learning_rate": 8.140350877192983e-06,
103
+ "loss": 0.6867,
104
+ "step": 406
105
  },
106
  {
107
+ "epoch": 6.99,
108
+ "eval_accuracy": 0.6428571343421936,
109
+ "eval_loss": 0.8555552363395691,
110
+ "eval_runtime": 46.718,
111
+ "eval_samples_per_second": 1.498,
112
+ "eval_steps_per_second": 0.385,
113
+ "step": 406
114
  },
115
  {
116
+ "epoch": 7.99,
117
+ "learning_rate": 7.140350877192983e-06,
118
+ "loss": 0.6218,
119
+ "step": 464
120
  },
121
  {
122
+ "epoch": 7.99,
123
+ "eval_accuracy": 0.6714285612106323,
124
+ "eval_loss": 0.8454030156135559,
125
+ "eval_runtime": 46.4466,
126
+ "eval_samples_per_second": 1.507,
127
+ "eval_steps_per_second": 0.388,
128
+ "step": 464
129
  },
130
  {
131
+ "epoch": 8.99,
132
+ "learning_rate": 6.140350877192983e-06,
133
+ "loss": 0.558,
134
+ "step": 522
135
  },
136
  {
137
+ "epoch": 8.99,
138
+ "eval_accuracy": 0.6571428775787354,
139
+ "eval_loss": 0.8404667973518372,
140
+ "eval_runtime": 46.7611,
141
+ "eval_samples_per_second": 1.497,
142
+ "eval_steps_per_second": 0.385,
143
+ "step": 522
144
  },
145
  {
146
+ "epoch": 9.99,
147
+ "learning_rate": 5.12280701754386e-06,
148
+ "loss": 0.5033,
149
+ "step": 580
150
  },
151
  {
152
+ "epoch": 9.99,
153
+ "eval_accuracy": 0.6285714507102966,
154
+ "eval_loss": 1.0190438032150269,
155
+ "eval_runtime": 47.1353,
156
+ "eval_samples_per_second": 1.485,
157
+ "eval_steps_per_second": 0.382,
158
+ "step": 580
159
  },
160
  {
161
+ "epoch": 10.99,
162
+ "learning_rate": 4.105263157894737e-06,
163
+ "loss": 0.4403,
164
+ "step": 638
165
  },
166
  {
167
+ "epoch": 10.99,
168
+ "eval_accuracy": 0.699999988079071,
169
+ "eval_loss": 0.82489013671875,
170
+ "eval_runtime": 46.7633,
171
+ "eval_samples_per_second": 1.497,
172
+ "eval_steps_per_second": 0.385,
173
+ "step": 638
174
  },
175
  {
176
+ "epoch": 11.99,
177
+ "learning_rate": 3.0877192982456146e-06,
178
+ "loss": 0.3995,
179
+ "step": 696
180
  },
181
  {
182
+ "epoch": 11.99,
183
+ "eval_accuracy": 0.7142857313156128,
184
+ "eval_loss": 0.8996997475624084,
185
+ "eval_runtime": 46.7333,
186
+ "eval_samples_per_second": 1.498,
187
+ "eval_steps_per_second": 0.385,
188
+ "step": 696
189
  },
190
  {
191
+ "epoch": 12.99,
192
+ "learning_rate": 2.0701754385964913e-06,
193
+ "loss": 0.3534,
194
+ "step": 754
195
  },
196
  {
197
+ "epoch": 12.99,
198
+ "eval_accuracy": 0.699999988079071,
199
+ "eval_loss": 0.9177280068397522,
200
+ "eval_runtime": 46.7502,
201
+ "eval_samples_per_second": 1.497,
202
+ "eval_steps_per_second": 0.385,
203
+ "step": 754
204
  },
205
  {
206
+ "epoch": 13.99,
207
+ "learning_rate": 1.0526315789473685e-06,
208
+ "loss": 0.3023,
209
+ "step": 812
210
  },
211
  {
212
+ "epoch": 13.99,
213
+ "eval_accuracy": 0.6571428775787354,
214
+ "eval_loss": 0.9544177651405334,
215
+ "eval_runtime": 46.7592,
216
+ "eval_samples_per_second": 1.497,
217
+ "eval_steps_per_second": 0.385,
218
+ "step": 812
219
  },
220
  {
221
+ "epoch": 14.99,
222
+ "learning_rate": 3.508771929824562e-08,
223
+ "loss": 0.2752,
224
+ "step": 870
225
  },
226
  {
227
+ "epoch": 14.99,
228
+ "eval_accuracy": 0.699999988079071,
229
+ "eval_loss": 0.9346058964729309,
230
+ "eval_runtime": 46.4397,
231
+ "eval_samples_per_second": 1.507,
232
+ "eval_steps_per_second": 0.388,
233
+ "step": 870
234
  },
235
  {
236
+ "epoch": 14.99,
237
+ "step": 870,
238
+ "total_flos": 4.99147314409986e+18,
239
+ "train_loss": 0.6941862314596944,
240
+ "train_runtime": 20182.4464,
241
+ "train_samples_per_second": 0.52,
242
+ "train_steps_per_second": 0.043
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
243
  }
244
  ],
245
+ "max_steps": 870,
246
+ "num_train_epochs": 15,
247
+ "total_flos": 4.99147314409986e+18,
248
  "trial_name": null,
249
  "trial_params": null
250
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9ccf48c4a0d78c84d927241619accb6e146ed3470c5f78ef19ec300caa18ccaa
3
  size 3055
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:129989de89a833eb0c8d9e960516ce76d7fddab79482e76bde4c7c1f16fb577e
3
  size 3055