File size: 12,543 Bytes
ab197ff
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
{
  "best_metric": 0.30745795369148254,
  "best_model_checkpoint": "asd_pronunciation_w2v_xlsr-reg/checkpoint-99",
  "epoch": 49.977777777777774,
  "global_step": 550,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 0.98,
      "eval_loss": 0.8269791603088379,
      "eval_mse": 0.8274638056755066,
      "eval_runtime": 67.3404,
      "eval_samples_per_second": 31.497,
      "eval_steps_per_second": 0.995,
      "step": 11
    },
    {
      "epoch": 1.98,
      "eval_loss": 0.4631172716617584,
      "eval_mse": 0.46300947666168213,
      "eval_runtime": 67.2163,
      "eval_samples_per_second": 31.555,
      "eval_steps_per_second": 0.997,
      "step": 22
    },
    {
      "epoch": 2.98,
      "eval_loss": 0.351409912109375,
      "eval_mse": 0.3515050709247589,
      "eval_runtime": 67.5563,
      "eval_samples_per_second": 31.396,
      "eval_steps_per_second": 0.992,
      "step": 33
    },
    {
      "epoch": 3.98,
      "eval_loss": 0.3585782051086426,
      "eval_mse": 0.35852691531181335,
      "eval_runtime": 69.7976,
      "eval_samples_per_second": 30.388,
      "eval_steps_per_second": 0.96,
      "step": 44
    },
    {
      "epoch": 4.98,
      "eval_loss": 0.4412296712398529,
      "eval_mse": 0.4412075877189636,
      "eval_runtime": 79.1138,
      "eval_samples_per_second": 26.809,
      "eval_steps_per_second": 0.847,
      "step": 55
    },
    {
      "epoch": 5.98,
      "eval_loss": 0.430486798286438,
      "eval_mse": 0.43049314618110657,
      "eval_runtime": 72.5547,
      "eval_samples_per_second": 29.233,
      "eval_steps_per_second": 0.923,
      "step": 66
    },
    {
      "epoch": 6.98,
      "eval_loss": 0.42916765809059143,
      "eval_mse": 0.4291659891605377,
      "eval_runtime": 95.5528,
      "eval_samples_per_second": 22.197,
      "eval_steps_per_second": 0.701,
      "step": 77
    },
    {
      "epoch": 7.98,
      "eval_loss": 0.4343053996562958,
      "eval_mse": 0.43428245186805725,
      "eval_runtime": 66.5007,
      "eval_samples_per_second": 31.894,
      "eval_steps_per_second": 1.008,
      "step": 88
    },
    {
      "epoch": 8.98,
      "eval_loss": 0.30745795369148254,
      "eval_mse": 0.3074318766593933,
      "eval_runtime": 66.2359,
      "eval_samples_per_second": 32.022,
      "eval_steps_per_second": 1.012,
      "step": 99
    },
    {
      "epoch": 9.98,
      "eval_loss": 0.42939332127571106,
      "eval_mse": 0.4293690323829651,
      "eval_runtime": 66.3865,
      "eval_samples_per_second": 31.949,
      "eval_steps_per_second": 1.009,
      "step": 110
    },
    {
      "epoch": 10.98,
      "eval_loss": 0.3727492094039917,
      "eval_mse": 0.3727482855319977,
      "eval_runtime": 66.8857,
      "eval_samples_per_second": 31.711,
      "eval_steps_per_second": 1.002,
      "step": 121
    },
    {
      "epoch": 11.98,
      "eval_loss": 0.42278197407722473,
      "eval_mse": 0.42277276515960693,
      "eval_runtime": 65.5197,
      "eval_samples_per_second": 32.372,
      "eval_steps_per_second": 1.023,
      "step": 132
    },
    {
      "epoch": 12.98,
      "eval_loss": 0.4014572203159332,
      "eval_mse": 0.40141549706459045,
      "eval_runtime": 65.6627,
      "eval_samples_per_second": 32.301,
      "eval_steps_per_second": 1.02,
      "step": 143
    },
    {
      "epoch": 13.98,
      "eval_loss": 0.37818050384521484,
      "eval_mse": 0.37818947434425354,
      "eval_runtime": 66.0031,
      "eval_samples_per_second": 32.135,
      "eval_steps_per_second": 1.015,
      "step": 154
    },
    {
      "epoch": 14.98,
      "eval_loss": 0.4358225166797638,
      "eval_mse": 0.43578916788101196,
      "eval_runtime": 65.7571,
      "eval_samples_per_second": 32.255,
      "eval_steps_per_second": 1.019,
      "step": 165
    },
    {
      "epoch": 15.98,
      "eval_loss": 0.36039263010025024,
      "eval_mse": 0.3603877127170563,
      "eval_runtime": 67.6323,
      "eval_samples_per_second": 31.361,
      "eval_steps_per_second": 0.991,
      "step": 176
    },
    {
      "epoch": 16.98,
      "eval_loss": 0.40446653962135315,
      "eval_mse": 0.40447959303855896,
      "eval_runtime": 66.1021,
      "eval_samples_per_second": 32.087,
      "eval_steps_per_second": 1.014,
      "step": 187
    },
    {
      "epoch": 17.98,
      "eval_loss": 0.3638509213924408,
      "eval_mse": 0.3638397455215454,
      "eval_runtime": 66.1765,
      "eval_samples_per_second": 32.051,
      "eval_steps_per_second": 1.012,
      "step": 198
    },
    {
      "epoch": 18.98,
      "eval_loss": 0.4001483619213104,
      "eval_mse": 0.400104284286499,
      "eval_runtime": 66.5235,
      "eval_samples_per_second": 31.883,
      "eval_steps_per_second": 1.007,
      "step": 209
    },
    {
      "epoch": 19.98,
      "eval_loss": 0.3836788535118103,
      "eval_mse": 0.38362112641334534,
      "eval_runtime": 65.5397,
      "eval_samples_per_second": 32.362,
      "eval_steps_per_second": 1.022,
      "step": 220
    },
    {
      "epoch": 20.98,
      "eval_loss": 0.3813478350639343,
      "eval_mse": 0.3813202679157257,
      "eval_runtime": 67.0847,
      "eval_samples_per_second": 31.617,
      "eval_steps_per_second": 0.999,
      "step": 231
    },
    {
      "epoch": 21.98,
      "eval_loss": 0.3911483883857727,
      "eval_mse": 0.39113306999206543,
      "eval_runtime": 66.4329,
      "eval_samples_per_second": 31.927,
      "eval_steps_per_second": 1.009,
      "step": 242
    },
    {
      "epoch": 22.98,
      "eval_loss": 0.43994417786598206,
      "eval_mse": 0.4399244487285614,
      "eval_runtime": 66.1358,
      "eval_samples_per_second": 32.07,
      "eval_steps_per_second": 1.013,
      "step": 253
    },
    {
      "epoch": 23.98,
      "eval_loss": 0.4228975772857666,
      "eval_mse": 0.42288002371788025,
      "eval_runtime": 66.6907,
      "eval_samples_per_second": 31.804,
      "eval_steps_per_second": 1.005,
      "step": 264
    },
    {
      "epoch": 24.98,
      "eval_loss": 0.4192221462726593,
      "eval_mse": 0.4191807508468628,
      "eval_runtime": 65.8241,
      "eval_samples_per_second": 32.222,
      "eval_steps_per_second": 1.018,
      "step": 275
    },
    {
      "epoch": 25.98,
      "eval_loss": 0.40975797176361084,
      "eval_mse": 0.4097472131252289,
      "eval_runtime": 67.5766,
      "eval_samples_per_second": 31.387,
      "eval_steps_per_second": 0.991,
      "step": 286
    },
    {
      "epoch": 26.98,
      "eval_loss": 0.3760901093482971,
      "eval_mse": 0.37607377767562866,
      "eval_runtime": 65.9157,
      "eval_samples_per_second": 32.177,
      "eval_steps_per_second": 1.016,
      "step": 297
    },
    {
      "epoch": 27.98,
      "eval_loss": 0.389096200466156,
      "eval_mse": 0.3890584111213684,
      "eval_runtime": 65.956,
      "eval_samples_per_second": 32.158,
      "eval_steps_per_second": 1.016,
      "step": 308
    },
    {
      "epoch": 28.98,
      "eval_loss": 0.4243176579475403,
      "eval_mse": 0.4242975115776062,
      "eval_runtime": 66.4794,
      "eval_samples_per_second": 31.905,
      "eval_steps_per_second": 1.008,
      "step": 319
    },
    {
      "epoch": 29.98,
      "eval_loss": 0.4235914349555969,
      "eval_mse": 0.4235744774341583,
      "eval_runtime": 66.2277,
      "eval_samples_per_second": 32.026,
      "eval_steps_per_second": 1.012,
      "step": 330
    },
    {
      "epoch": 30.98,
      "eval_loss": 0.4235081076622009,
      "eval_mse": 0.42347782850265503,
      "eval_runtime": 66.6381,
      "eval_samples_per_second": 31.829,
      "eval_steps_per_second": 1.005,
      "step": 341
    },
    {
      "epoch": 31.98,
      "eval_loss": 0.4236636757850647,
      "eval_mse": 0.4236546456813812,
      "eval_runtime": 65.6032,
      "eval_samples_per_second": 32.331,
      "eval_steps_per_second": 1.021,
      "step": 352
    },
    {
      "epoch": 32.98,
      "eval_loss": 0.4269878566265106,
      "eval_mse": 0.4269687533378601,
      "eval_runtime": 65.9665,
      "eval_samples_per_second": 32.153,
      "eval_steps_per_second": 1.016,
      "step": 363
    },
    {
      "epoch": 33.98,
      "eval_loss": 0.39142194390296936,
      "eval_mse": 0.3913804888725281,
      "eval_runtime": 66.6217,
      "eval_samples_per_second": 31.836,
      "eval_steps_per_second": 1.006,
      "step": 374
    },
    {
      "epoch": 34.98,
      "eval_loss": 0.3899790942668915,
      "eval_mse": 0.38995301723480225,
      "eval_runtime": 65.771,
      "eval_samples_per_second": 32.248,
      "eval_steps_per_second": 1.019,
      "step": 385
    },
    {
      "epoch": 35.98,
      "eval_loss": 0.4031297564506531,
      "eval_mse": 0.4031302034854889,
      "eval_runtime": 68.033,
      "eval_samples_per_second": 31.176,
      "eval_steps_per_second": 0.985,
      "step": 396
    },
    {
      "epoch": 36.98,
      "eval_loss": 0.373826265335083,
      "eval_mse": 0.3738201856613159,
      "eval_runtime": 66.1644,
      "eval_samples_per_second": 32.057,
      "eval_steps_per_second": 1.013,
      "step": 407
    },
    {
      "epoch": 37.98,
      "eval_loss": 0.37409740686416626,
      "eval_mse": 0.37407544255256653,
      "eval_runtime": 65.7007,
      "eval_samples_per_second": 32.283,
      "eval_steps_per_second": 1.02,
      "step": 418
    },
    {
      "epoch": 38.98,
      "eval_loss": 0.41098639369010925,
      "eval_mse": 0.4109634459018707,
      "eval_runtime": 65.8334,
      "eval_samples_per_second": 32.218,
      "eval_steps_per_second": 1.018,
      "step": 429
    },
    {
      "epoch": 39.98,
      "eval_loss": 0.38580140471458435,
      "eval_mse": 0.3857785165309906,
      "eval_runtime": 65.912,
      "eval_samples_per_second": 32.179,
      "eval_steps_per_second": 1.017,
      "step": 440
    },
    {
      "epoch": 40.98,
      "eval_loss": 0.40168315172195435,
      "eval_mse": 0.4016563296318054,
      "eval_runtime": 67.322,
      "eval_samples_per_second": 31.505,
      "eval_steps_per_second": 0.995,
      "step": 451
    },
    {
      "epoch": 41.98,
      "eval_loss": 0.3875749111175537,
      "eval_mse": 0.3875587284564972,
      "eval_runtime": 65.9445,
      "eval_samples_per_second": 32.163,
      "eval_steps_per_second": 1.016,
      "step": 462
    },
    {
      "epoch": 42.98,
      "eval_loss": 0.401607483625412,
      "eval_mse": 0.4015834629535675,
      "eval_runtime": 66.235,
      "eval_samples_per_second": 32.022,
      "eval_steps_per_second": 1.012,
      "step": 473
    },
    {
      "epoch": 43.98,
      "eval_loss": 0.3939042389392853,
      "eval_mse": 0.3938945233821869,
      "eval_runtime": 66.0054,
      "eval_samples_per_second": 32.134,
      "eval_steps_per_second": 1.015,
      "step": 484
    },
    {
      "epoch": 44.98,
      "eval_loss": 0.40803390741348267,
      "eval_mse": 0.40802931785583496,
      "eval_runtime": 66.0842,
      "eval_samples_per_second": 32.095,
      "eval_steps_per_second": 1.014,
      "step": 495
    },
    {
      "epoch": 45.44,
      "learning_rate": 3.03030303030303e-05,
      "loss": 0.4034,
      "step": 500
    },
    {
      "epoch": 45.98,
      "eval_loss": 0.38819119334220886,
      "eval_mse": 0.38818415999412537,
      "eval_runtime": 67.7262,
      "eval_samples_per_second": 31.317,
      "eval_steps_per_second": 0.989,
      "step": 506
    },
    {
      "epoch": 46.98,
      "eval_loss": 0.4062108099460602,
      "eval_mse": 0.4061962068080902,
      "eval_runtime": 63.6037,
      "eval_samples_per_second": 33.347,
      "eval_steps_per_second": 1.053,
      "step": 517
    },
    {
      "epoch": 47.98,
      "eval_loss": 0.38834279775619507,
      "eval_mse": 0.38832658529281616,
      "eval_runtime": 64.2256,
      "eval_samples_per_second": 33.024,
      "eval_steps_per_second": 1.043,
      "step": 528
    },
    {
      "epoch": 48.98,
      "eval_loss": 0.3969601094722748,
      "eval_mse": 0.3969435691833496,
      "eval_runtime": 63.6409,
      "eval_samples_per_second": 33.328,
      "eval_steps_per_second": 1.053,
      "step": 539
    },
    {
      "epoch": 49.98,
      "eval_loss": 0.3963707685470581,
      "eval_mse": 0.3963526785373688,
      "eval_runtime": 63.4841,
      "eval_samples_per_second": 33.41,
      "eval_steps_per_second": 1.055,
      "step": 550
    }
  ],
  "max_steps": 550,
  "num_train_epochs": 50,
  "total_flos": 1.603121844978697e+20,
  "trial_name": null,
  "trial_params": null
}