File size: 12,742 Bytes
2607071
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
{
  "best_metric": 1.0679948329925537,
  "best_model_checkpoint": "asd_pronunciation_w2v_xlsr-300m/checkpoint-99",
  "epoch": 49.977777777777774,
  "global_step": 550,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 0.98,
      "eval_accuracy": 0.33144742250442505,
      "eval_loss": 1.5670545101165771,
      "eval_runtime": 62.8235,
      "eval_samples_per_second": 33.761,
      "eval_steps_per_second": 1.066,
      "step": 11
    },
    {
      "epoch": 1.98,
      "eval_accuracy": 0.39273926615715027,
      "eval_loss": 1.3582004308700562,
      "eval_runtime": 62.2914,
      "eval_samples_per_second": 34.05,
      "eval_steps_per_second": 1.076,
      "step": 22
    },
    {
      "epoch": 2.98,
      "eval_accuracy": 0.380952388048172,
      "eval_loss": 1.3765946626663208,
      "eval_runtime": 63.9238,
      "eval_samples_per_second": 33.18,
      "eval_steps_per_second": 1.048,
      "step": 33
    },
    {
      "epoch": 3.98,
      "eval_accuracy": 0.4186704456806183,
      "eval_loss": 1.3837833404541016,
      "eval_runtime": 63.6397,
      "eval_samples_per_second": 33.328,
      "eval_steps_per_second": 1.053,
      "step": 44
    },
    {
      "epoch": 4.98,
      "eval_accuracy": 0.3663366436958313,
      "eval_loss": 1.5986249446868896,
      "eval_runtime": 63.7365,
      "eval_samples_per_second": 33.278,
      "eval_steps_per_second": 1.051,
      "step": 55
    },
    {
      "epoch": 5.98,
      "eval_accuracy": 0.42904290556907654,
      "eval_loss": 1.8822154998779297,
      "eval_runtime": 63.6958,
      "eval_samples_per_second": 33.299,
      "eval_steps_per_second": 1.052,
      "step": 66
    },
    {
      "epoch": 6.98,
      "eval_accuracy": 0.34983497858047485,
      "eval_loss": 1.865776538848877,
      "eval_runtime": 63.1847,
      "eval_samples_per_second": 33.568,
      "eval_steps_per_second": 1.06,
      "step": 77
    },
    {
      "epoch": 7.98,
      "eval_accuracy": 0.4502592980861664,
      "eval_loss": 1.966166377067566,
      "eval_runtime": 63.6503,
      "eval_samples_per_second": 33.323,
      "eval_steps_per_second": 1.053,
      "step": 88
    },
    {
      "epoch": 8.98,
      "eval_accuracy": 0.6855257153511047,
      "eval_loss": 1.0679948329925537,
      "eval_runtime": 63.1701,
      "eval_samples_per_second": 33.576,
      "eval_steps_per_second": 1.061,
      "step": 99
    },
    {
      "epoch": 9.98,
      "eval_accuracy": 0.6539368033409119,
      "eval_loss": 1.1463075876235962,
      "eval_runtime": 63.3309,
      "eval_samples_per_second": 33.491,
      "eval_steps_per_second": 1.058,
      "step": 110
    },
    {
      "epoch": 10.98,
      "eval_accuracy": 0.7157001495361328,
      "eval_loss": 1.1053473949432373,
      "eval_runtime": 63.7039,
      "eval_samples_per_second": 33.295,
      "eval_steps_per_second": 1.052,
      "step": 121
    },
    {
      "epoch": 11.98,
      "eval_accuracy": 0.5836869478225708,
      "eval_loss": 1.6300278902053833,
      "eval_runtime": 63.4359,
      "eval_samples_per_second": 33.435,
      "eval_steps_per_second": 1.056,
      "step": 132
    },
    {
      "epoch": 12.98,
      "eval_accuracy": 0.697312593460083,
      "eval_loss": 1.190132975578308,
      "eval_runtime": 62.8623,
      "eval_samples_per_second": 33.74,
      "eval_steps_per_second": 1.066,
      "step": 143
    },
    {
      "epoch": 13.98,
      "eval_accuracy": 0.5761433243751526,
      "eval_loss": 1.677795171737671,
      "eval_runtime": 63.1508,
      "eval_samples_per_second": 33.586,
      "eval_steps_per_second": 1.061,
      "step": 154
    },
    {
      "epoch": 14.98,
      "eval_accuracy": 0.7072135806083679,
      "eval_loss": 1.2646026611328125,
      "eval_runtime": 64.2737,
      "eval_samples_per_second": 33.0,
      "eval_steps_per_second": 1.042,
      "step": 165
    },
    {
      "epoch": 15.98,
      "eval_accuracy": 0.5535125136375427,
      "eval_loss": 1.866857647895813,
      "eval_runtime": 63.6272,
      "eval_samples_per_second": 33.335,
      "eval_steps_per_second": 1.053,
      "step": 176
    },
    {
      "epoch": 16.98,
      "eval_accuracy": 0.5700141191482544,
      "eval_loss": 1.911484956741333,
      "eval_runtime": 63.0574,
      "eval_samples_per_second": 33.636,
      "eval_steps_per_second": 1.063,
      "step": 187
    },
    {
      "epoch": 17.98,
      "eval_accuracy": 0.608203649520874,
      "eval_loss": 1.748372197151184,
      "eval_runtime": 63.9869,
      "eval_samples_per_second": 33.147,
      "eval_steps_per_second": 1.047,
      "step": 198
    },
    {
      "epoch": 18.98,
      "eval_accuracy": 0.6209335327148438,
      "eval_loss": 1.736160159111023,
      "eval_runtime": 63.5615,
      "eval_samples_per_second": 33.369,
      "eval_steps_per_second": 1.054,
      "step": 209
    },
    {
      "epoch": 19.98,
      "eval_accuracy": 0.5535125136375427,
      "eval_loss": 2.0504212379455566,
      "eval_runtime": 63.6231,
      "eval_samples_per_second": 33.337,
      "eval_steps_per_second": 1.053,
      "step": 220
    },
    {
      "epoch": 20.98,
      "eval_accuracy": 0.6520509123802185,
      "eval_loss": 1.6594103574752808,
      "eval_runtime": 63.6587,
      "eval_samples_per_second": 33.318,
      "eval_steps_per_second": 1.052,
      "step": 231
    },
    {
      "epoch": 21.98,
      "eval_accuracy": 0.6779820919036865,
      "eval_loss": 1.5675663948059082,
      "eval_runtime": 64.5637,
      "eval_samples_per_second": 32.851,
      "eval_steps_per_second": 1.038,
      "step": 242
    },
    {
      "epoch": 22.98,
      "eval_accuracy": 0.6737387776374817,
      "eval_loss": 1.6316275596618652,
      "eval_runtime": 63.4257,
      "eval_samples_per_second": 33.441,
      "eval_steps_per_second": 1.056,
      "step": 253
    },
    {
      "epoch": 23.98,
      "eval_accuracy": 0.5983026623725891,
      "eval_loss": 1.9427396059036255,
      "eval_runtime": 63.6629,
      "eval_samples_per_second": 33.316,
      "eval_steps_per_second": 1.052,
      "step": 264
    },
    {
      "epoch": 24.98,
      "eval_accuracy": 0.6619518995285034,
      "eval_loss": 1.7251100540161133,
      "eval_runtime": 63.8986,
      "eval_samples_per_second": 33.193,
      "eval_steps_per_second": 1.049,
      "step": 275
    },
    {
      "epoch": 25.98,
      "eval_accuracy": 0.7133427858352661,
      "eval_loss": 1.4861173629760742,
      "eval_runtime": 63.105,
      "eval_samples_per_second": 33.611,
      "eval_steps_per_second": 1.062,
      "step": 286
    },
    {
      "epoch": 26.98,
      "eval_accuracy": 0.6388496160507202,
      "eval_loss": 1.8551920652389526,
      "eval_runtime": 63.3692,
      "eval_samples_per_second": 33.471,
      "eval_steps_per_second": 1.057,
      "step": 297
    },
    {
      "epoch": 27.98,
      "eval_accuracy": 0.6218764781951904,
      "eval_loss": 1.9755550622940063,
      "eval_runtime": 63.7438,
      "eval_samples_per_second": 33.274,
      "eval_steps_per_second": 1.051,
      "step": 308
    },
    {
      "epoch": 28.98,
      "eval_accuracy": 0.5879302024841309,
      "eval_loss": 2.2480831146240234,
      "eval_runtime": 62.9459,
      "eval_samples_per_second": 33.696,
      "eval_steps_per_second": 1.064,
      "step": 319
    },
    {
      "epoch": 29.98,
      "eval_accuracy": 0.6176331639289856,
      "eval_loss": 1.9868534803390503,
      "eval_runtime": 63.9115,
      "eval_samples_per_second": 33.187,
      "eval_steps_per_second": 1.048,
      "step": 330
    },
    {
      "epoch": 30.98,
      "eval_accuracy": 0.6991984844207764,
      "eval_loss": 1.6001139879226685,
      "eval_runtime": 62.9701,
      "eval_samples_per_second": 33.683,
      "eval_steps_per_second": 1.064,
      "step": 341
    },
    {
      "epoch": 31.98,
      "eval_accuracy": 0.6562942266464233,
      "eval_loss": 1.80760657787323,
      "eval_runtime": 64.5355,
      "eval_samples_per_second": 32.866,
      "eval_steps_per_second": 1.038,
      "step": 352
    },
    {
      "epoch": 32.98,
      "eval_accuracy": 0.6539368033409119,
      "eval_loss": 1.8803389072418213,
      "eval_runtime": 63.8068,
      "eval_samples_per_second": 33.241,
      "eval_steps_per_second": 1.05,
      "step": 363
    },
    {
      "epoch": 33.98,
      "eval_accuracy": 0.6308345198631287,
      "eval_loss": 1.9857879877090454,
      "eval_runtime": 63.5545,
      "eval_samples_per_second": 33.373,
      "eval_steps_per_second": 1.054,
      "step": 374
    },
    {
      "epoch": 34.98,
      "eval_accuracy": 0.6228194236755371,
      "eval_loss": 2.016218900680542,
      "eval_runtime": 63.1093,
      "eval_samples_per_second": 33.608,
      "eval_steps_per_second": 1.062,
      "step": 385
    },
    {
      "epoch": 35.98,
      "eval_accuracy": 0.6247053146362305,
      "eval_loss": 1.9806338548660278,
      "eval_runtime": 63.643,
      "eval_samples_per_second": 33.327,
      "eval_steps_per_second": 1.053,
      "step": 396
    },
    {
      "epoch": 36.98,
      "eval_accuracy": 0.6148043274879456,
      "eval_loss": 2.0684027671813965,
      "eval_runtime": 63.1391,
      "eval_samples_per_second": 33.593,
      "eval_steps_per_second": 1.061,
      "step": 407
    },
    {
      "epoch": 37.98,
      "eval_accuracy": 0.6826968193054199,
      "eval_loss": 1.7208051681518555,
      "eval_runtime": 63.3764,
      "eval_samples_per_second": 33.467,
      "eval_steps_per_second": 1.057,
      "step": 418
    },
    {
      "epoch": 38.98,
      "eval_accuracy": 0.6676096320152283,
      "eval_loss": 1.7736769914627075,
      "eval_runtime": 63.0716,
      "eval_samples_per_second": 33.628,
      "eval_steps_per_second": 1.062,
      "step": 429
    },
    {
      "epoch": 39.98,
      "eval_accuracy": 0.6940122842788696,
      "eval_loss": 1.7225761413574219,
      "eval_runtime": 64.0078,
      "eval_samples_per_second": 33.137,
      "eval_steps_per_second": 1.047,
      "step": 440
    },
    {
      "epoch": 40.98,
      "eval_accuracy": 0.606789231300354,
      "eval_loss": 2.0414962768554688,
      "eval_runtime": 63.4689,
      "eval_samples_per_second": 33.418,
      "eval_steps_per_second": 1.056,
      "step": 451
    },
    {
      "epoch": 41.98,
      "eval_accuracy": 0.6214050054550171,
      "eval_loss": 2.019111394882202,
      "eval_runtime": 63.5976,
      "eval_samples_per_second": 33.35,
      "eval_steps_per_second": 1.053,
      "step": 462
    },
    {
      "epoch": 42.98,
      "eval_accuracy": 0.6379066705703735,
      "eval_loss": 1.947460412979126,
      "eval_runtime": 63.6957,
      "eval_samples_per_second": 33.299,
      "eval_steps_per_second": 1.052,
      "step": 473
    },
    {
      "epoch": 43.98,
      "eval_accuracy": 0.669966995716095,
      "eval_loss": 1.8389097452163696,
      "eval_runtime": 64.1144,
      "eval_samples_per_second": 33.081,
      "eval_steps_per_second": 1.045,
      "step": 484
    },
    {
      "epoch": 44.98,
      "eval_accuracy": 0.6666666865348816,
      "eval_loss": 1.814638376235962,
      "eval_runtime": 63.7225,
      "eval_samples_per_second": 33.285,
      "eval_steps_per_second": 1.051,
      "step": 495
    },
    {
      "epoch": 45.44,
      "learning_rate": 3.03030303030303e-05,
      "loss": 0.3177,
      "step": 500
    },
    {
      "epoch": 45.98,
      "eval_accuracy": 0.6718528866767883,
      "eval_loss": 1.79548978805542,
      "eval_runtime": 63.2169,
      "eval_samples_per_second": 33.551,
      "eval_steps_per_second": 1.06,
      "step": 506
    },
    {
      "epoch": 46.98,
      "eval_accuracy": 0.65865159034729,
      "eval_loss": 1.9061682224273682,
      "eval_runtime": 64.47,
      "eval_samples_per_second": 32.899,
      "eval_steps_per_second": 1.039,
      "step": 517
    },
    {
      "epoch": 47.98,
      "eval_accuracy": 0.6643092632293701,
      "eval_loss": 1.8877029418945312,
      "eval_runtime": 63.3351,
      "eval_samples_per_second": 33.489,
      "eval_steps_per_second": 1.058,
      "step": 528
    },
    {
      "epoch": 48.98,
      "eval_accuracy": 0.6694955229759216,
      "eval_loss": 1.8578468561172485,
      "eval_runtime": 63.6561,
      "eval_samples_per_second": 33.32,
      "eval_steps_per_second": 1.053,
      "step": 539
    },
    {
      "epoch": 49.98,
      "eval_accuracy": 0.6690240502357483,
      "eval_loss": 1.8590630292892456,
      "eval_runtime": 62.2809,
      "eval_samples_per_second": 34.055,
      "eval_steps_per_second": 1.076,
      "step": 550
    }
  ],
  "max_steps": 550,
  "num_train_epochs": 50,
  "total_flos": 1.6031529967362595e+20,
  "trial_name": null,
  "trial_params": null
}