|
{ |
|
"best_metric": 1.0679948329925537, |
|
"best_model_checkpoint": "asd_pronunciation_w2v_xlsr-300m/checkpoint-99", |
|
"epoch": 49.977777777777774, |
|
"global_step": 550, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.98, |
|
"eval_accuracy": 0.33144742250442505, |
|
"eval_loss": 1.5670545101165771, |
|
"eval_runtime": 62.8235, |
|
"eval_samples_per_second": 33.761, |
|
"eval_steps_per_second": 1.066, |
|
"step": 11 |
|
}, |
|
{ |
|
"epoch": 1.98, |
|
"eval_accuracy": 0.39273926615715027, |
|
"eval_loss": 1.3582004308700562, |
|
"eval_runtime": 62.2914, |
|
"eval_samples_per_second": 34.05, |
|
"eval_steps_per_second": 1.076, |
|
"step": 22 |
|
}, |
|
{ |
|
"epoch": 2.98, |
|
"eval_accuracy": 0.380952388048172, |
|
"eval_loss": 1.3765946626663208, |
|
"eval_runtime": 63.9238, |
|
"eval_samples_per_second": 33.18, |
|
"eval_steps_per_second": 1.048, |
|
"step": 33 |
|
}, |
|
{ |
|
"epoch": 3.98, |
|
"eval_accuracy": 0.4186704456806183, |
|
"eval_loss": 1.3837833404541016, |
|
"eval_runtime": 63.6397, |
|
"eval_samples_per_second": 33.328, |
|
"eval_steps_per_second": 1.053, |
|
"step": 44 |
|
}, |
|
{ |
|
"epoch": 4.98, |
|
"eval_accuracy": 0.3663366436958313, |
|
"eval_loss": 1.5986249446868896, |
|
"eval_runtime": 63.7365, |
|
"eval_samples_per_second": 33.278, |
|
"eval_steps_per_second": 1.051, |
|
"step": 55 |
|
}, |
|
{ |
|
"epoch": 5.98, |
|
"eval_accuracy": 0.42904290556907654, |
|
"eval_loss": 1.8822154998779297, |
|
"eval_runtime": 63.6958, |
|
"eval_samples_per_second": 33.299, |
|
"eval_steps_per_second": 1.052, |
|
"step": 66 |
|
}, |
|
{ |
|
"epoch": 6.98, |
|
"eval_accuracy": 0.34983497858047485, |
|
"eval_loss": 1.865776538848877, |
|
"eval_runtime": 63.1847, |
|
"eval_samples_per_second": 33.568, |
|
"eval_steps_per_second": 1.06, |
|
"step": 77 |
|
}, |
|
{ |
|
"epoch": 7.98, |
|
"eval_accuracy": 0.4502592980861664, |
|
"eval_loss": 1.966166377067566, |
|
"eval_runtime": 63.6503, |
|
"eval_samples_per_second": 33.323, |
|
"eval_steps_per_second": 1.053, |
|
"step": 88 |
|
}, |
|
{ |
|
"epoch": 8.98, |
|
"eval_accuracy": 0.6855257153511047, |
|
"eval_loss": 1.0679948329925537, |
|
"eval_runtime": 63.1701, |
|
"eval_samples_per_second": 33.576, |
|
"eval_steps_per_second": 1.061, |
|
"step": 99 |
|
}, |
|
{ |
|
"epoch": 9.98, |
|
"eval_accuracy": 0.6539368033409119, |
|
"eval_loss": 1.1463075876235962, |
|
"eval_runtime": 63.3309, |
|
"eval_samples_per_second": 33.491, |
|
"eval_steps_per_second": 1.058, |
|
"step": 110 |
|
}, |
|
{ |
|
"epoch": 10.98, |
|
"eval_accuracy": 0.7157001495361328, |
|
"eval_loss": 1.1053473949432373, |
|
"eval_runtime": 63.7039, |
|
"eval_samples_per_second": 33.295, |
|
"eval_steps_per_second": 1.052, |
|
"step": 121 |
|
}, |
|
{ |
|
"epoch": 11.98, |
|
"eval_accuracy": 0.5836869478225708, |
|
"eval_loss": 1.6300278902053833, |
|
"eval_runtime": 63.4359, |
|
"eval_samples_per_second": 33.435, |
|
"eval_steps_per_second": 1.056, |
|
"step": 132 |
|
}, |
|
{ |
|
"epoch": 12.98, |
|
"eval_accuracy": 0.697312593460083, |
|
"eval_loss": 1.190132975578308, |
|
"eval_runtime": 62.8623, |
|
"eval_samples_per_second": 33.74, |
|
"eval_steps_per_second": 1.066, |
|
"step": 143 |
|
}, |
|
{ |
|
"epoch": 13.98, |
|
"eval_accuracy": 0.5761433243751526, |
|
"eval_loss": 1.677795171737671, |
|
"eval_runtime": 63.1508, |
|
"eval_samples_per_second": 33.586, |
|
"eval_steps_per_second": 1.061, |
|
"step": 154 |
|
}, |
|
{ |
|
"epoch": 14.98, |
|
"eval_accuracy": 0.7072135806083679, |
|
"eval_loss": 1.2646026611328125, |
|
"eval_runtime": 64.2737, |
|
"eval_samples_per_second": 33.0, |
|
"eval_steps_per_second": 1.042, |
|
"step": 165 |
|
}, |
|
{ |
|
"epoch": 15.98, |
|
"eval_accuracy": 0.5535125136375427, |
|
"eval_loss": 1.866857647895813, |
|
"eval_runtime": 63.6272, |
|
"eval_samples_per_second": 33.335, |
|
"eval_steps_per_second": 1.053, |
|
"step": 176 |
|
}, |
|
{ |
|
"epoch": 16.98, |
|
"eval_accuracy": 0.5700141191482544, |
|
"eval_loss": 1.911484956741333, |
|
"eval_runtime": 63.0574, |
|
"eval_samples_per_second": 33.636, |
|
"eval_steps_per_second": 1.063, |
|
"step": 187 |
|
}, |
|
{ |
|
"epoch": 17.98, |
|
"eval_accuracy": 0.608203649520874, |
|
"eval_loss": 1.748372197151184, |
|
"eval_runtime": 63.9869, |
|
"eval_samples_per_second": 33.147, |
|
"eval_steps_per_second": 1.047, |
|
"step": 198 |
|
}, |
|
{ |
|
"epoch": 18.98, |
|
"eval_accuracy": 0.6209335327148438, |
|
"eval_loss": 1.736160159111023, |
|
"eval_runtime": 63.5615, |
|
"eval_samples_per_second": 33.369, |
|
"eval_steps_per_second": 1.054, |
|
"step": 209 |
|
}, |
|
{ |
|
"epoch": 19.98, |
|
"eval_accuracy": 0.5535125136375427, |
|
"eval_loss": 2.0504212379455566, |
|
"eval_runtime": 63.6231, |
|
"eval_samples_per_second": 33.337, |
|
"eval_steps_per_second": 1.053, |
|
"step": 220 |
|
}, |
|
{ |
|
"epoch": 20.98, |
|
"eval_accuracy": 0.6520509123802185, |
|
"eval_loss": 1.6594103574752808, |
|
"eval_runtime": 63.6587, |
|
"eval_samples_per_second": 33.318, |
|
"eval_steps_per_second": 1.052, |
|
"step": 231 |
|
}, |
|
{ |
|
"epoch": 21.98, |
|
"eval_accuracy": 0.6779820919036865, |
|
"eval_loss": 1.5675663948059082, |
|
"eval_runtime": 64.5637, |
|
"eval_samples_per_second": 32.851, |
|
"eval_steps_per_second": 1.038, |
|
"step": 242 |
|
}, |
|
{ |
|
"epoch": 22.98, |
|
"eval_accuracy": 0.6737387776374817, |
|
"eval_loss": 1.6316275596618652, |
|
"eval_runtime": 63.4257, |
|
"eval_samples_per_second": 33.441, |
|
"eval_steps_per_second": 1.056, |
|
"step": 253 |
|
}, |
|
{ |
|
"epoch": 23.98, |
|
"eval_accuracy": 0.5983026623725891, |
|
"eval_loss": 1.9427396059036255, |
|
"eval_runtime": 63.6629, |
|
"eval_samples_per_second": 33.316, |
|
"eval_steps_per_second": 1.052, |
|
"step": 264 |
|
}, |
|
{ |
|
"epoch": 24.98, |
|
"eval_accuracy": 0.6619518995285034, |
|
"eval_loss": 1.7251100540161133, |
|
"eval_runtime": 63.8986, |
|
"eval_samples_per_second": 33.193, |
|
"eval_steps_per_second": 1.049, |
|
"step": 275 |
|
}, |
|
{ |
|
"epoch": 25.98, |
|
"eval_accuracy": 0.7133427858352661, |
|
"eval_loss": 1.4861173629760742, |
|
"eval_runtime": 63.105, |
|
"eval_samples_per_second": 33.611, |
|
"eval_steps_per_second": 1.062, |
|
"step": 286 |
|
}, |
|
{ |
|
"epoch": 26.98, |
|
"eval_accuracy": 0.6388496160507202, |
|
"eval_loss": 1.8551920652389526, |
|
"eval_runtime": 63.3692, |
|
"eval_samples_per_second": 33.471, |
|
"eval_steps_per_second": 1.057, |
|
"step": 297 |
|
}, |
|
{ |
|
"epoch": 27.98, |
|
"eval_accuracy": 0.6218764781951904, |
|
"eval_loss": 1.9755550622940063, |
|
"eval_runtime": 63.7438, |
|
"eval_samples_per_second": 33.274, |
|
"eval_steps_per_second": 1.051, |
|
"step": 308 |
|
}, |
|
{ |
|
"epoch": 28.98, |
|
"eval_accuracy": 0.5879302024841309, |
|
"eval_loss": 2.2480831146240234, |
|
"eval_runtime": 62.9459, |
|
"eval_samples_per_second": 33.696, |
|
"eval_steps_per_second": 1.064, |
|
"step": 319 |
|
}, |
|
{ |
|
"epoch": 29.98, |
|
"eval_accuracy": 0.6176331639289856, |
|
"eval_loss": 1.9868534803390503, |
|
"eval_runtime": 63.9115, |
|
"eval_samples_per_second": 33.187, |
|
"eval_steps_per_second": 1.048, |
|
"step": 330 |
|
}, |
|
{ |
|
"epoch": 30.98, |
|
"eval_accuracy": 0.6991984844207764, |
|
"eval_loss": 1.6001139879226685, |
|
"eval_runtime": 62.9701, |
|
"eval_samples_per_second": 33.683, |
|
"eval_steps_per_second": 1.064, |
|
"step": 341 |
|
}, |
|
{ |
|
"epoch": 31.98, |
|
"eval_accuracy": 0.6562942266464233, |
|
"eval_loss": 1.80760657787323, |
|
"eval_runtime": 64.5355, |
|
"eval_samples_per_second": 32.866, |
|
"eval_steps_per_second": 1.038, |
|
"step": 352 |
|
}, |
|
{ |
|
"epoch": 32.98, |
|
"eval_accuracy": 0.6539368033409119, |
|
"eval_loss": 1.8803389072418213, |
|
"eval_runtime": 63.8068, |
|
"eval_samples_per_second": 33.241, |
|
"eval_steps_per_second": 1.05, |
|
"step": 363 |
|
}, |
|
{ |
|
"epoch": 33.98, |
|
"eval_accuracy": 0.6308345198631287, |
|
"eval_loss": 1.9857879877090454, |
|
"eval_runtime": 63.5545, |
|
"eval_samples_per_second": 33.373, |
|
"eval_steps_per_second": 1.054, |
|
"step": 374 |
|
}, |
|
{ |
|
"epoch": 34.98, |
|
"eval_accuracy": 0.6228194236755371, |
|
"eval_loss": 2.016218900680542, |
|
"eval_runtime": 63.1093, |
|
"eval_samples_per_second": 33.608, |
|
"eval_steps_per_second": 1.062, |
|
"step": 385 |
|
}, |
|
{ |
|
"epoch": 35.98, |
|
"eval_accuracy": 0.6247053146362305, |
|
"eval_loss": 1.9806338548660278, |
|
"eval_runtime": 63.643, |
|
"eval_samples_per_second": 33.327, |
|
"eval_steps_per_second": 1.053, |
|
"step": 396 |
|
}, |
|
{ |
|
"epoch": 36.98, |
|
"eval_accuracy": 0.6148043274879456, |
|
"eval_loss": 2.0684027671813965, |
|
"eval_runtime": 63.1391, |
|
"eval_samples_per_second": 33.593, |
|
"eval_steps_per_second": 1.061, |
|
"step": 407 |
|
}, |
|
{ |
|
"epoch": 37.98, |
|
"eval_accuracy": 0.6826968193054199, |
|
"eval_loss": 1.7208051681518555, |
|
"eval_runtime": 63.3764, |
|
"eval_samples_per_second": 33.467, |
|
"eval_steps_per_second": 1.057, |
|
"step": 418 |
|
}, |
|
{ |
|
"epoch": 38.98, |
|
"eval_accuracy": 0.6676096320152283, |
|
"eval_loss": 1.7736769914627075, |
|
"eval_runtime": 63.0716, |
|
"eval_samples_per_second": 33.628, |
|
"eval_steps_per_second": 1.062, |
|
"step": 429 |
|
}, |
|
{ |
|
"epoch": 39.98, |
|
"eval_accuracy": 0.6940122842788696, |
|
"eval_loss": 1.7225761413574219, |
|
"eval_runtime": 64.0078, |
|
"eval_samples_per_second": 33.137, |
|
"eval_steps_per_second": 1.047, |
|
"step": 440 |
|
}, |
|
{ |
|
"epoch": 40.98, |
|
"eval_accuracy": 0.606789231300354, |
|
"eval_loss": 2.0414962768554688, |
|
"eval_runtime": 63.4689, |
|
"eval_samples_per_second": 33.418, |
|
"eval_steps_per_second": 1.056, |
|
"step": 451 |
|
}, |
|
{ |
|
"epoch": 41.98, |
|
"eval_accuracy": 0.6214050054550171, |
|
"eval_loss": 2.019111394882202, |
|
"eval_runtime": 63.5976, |
|
"eval_samples_per_second": 33.35, |
|
"eval_steps_per_second": 1.053, |
|
"step": 462 |
|
}, |
|
{ |
|
"epoch": 42.98, |
|
"eval_accuracy": 0.6379066705703735, |
|
"eval_loss": 1.947460412979126, |
|
"eval_runtime": 63.6957, |
|
"eval_samples_per_second": 33.299, |
|
"eval_steps_per_second": 1.052, |
|
"step": 473 |
|
}, |
|
{ |
|
"epoch": 43.98, |
|
"eval_accuracy": 0.669966995716095, |
|
"eval_loss": 1.8389097452163696, |
|
"eval_runtime": 64.1144, |
|
"eval_samples_per_second": 33.081, |
|
"eval_steps_per_second": 1.045, |
|
"step": 484 |
|
}, |
|
{ |
|
"epoch": 44.98, |
|
"eval_accuracy": 0.6666666865348816, |
|
"eval_loss": 1.814638376235962, |
|
"eval_runtime": 63.7225, |
|
"eval_samples_per_second": 33.285, |
|
"eval_steps_per_second": 1.051, |
|
"step": 495 |
|
}, |
|
{ |
|
"epoch": 45.44, |
|
"learning_rate": 3.03030303030303e-05, |
|
"loss": 0.3177, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 45.98, |
|
"eval_accuracy": 0.6718528866767883, |
|
"eval_loss": 1.79548978805542, |
|
"eval_runtime": 63.2169, |
|
"eval_samples_per_second": 33.551, |
|
"eval_steps_per_second": 1.06, |
|
"step": 506 |
|
}, |
|
{ |
|
"epoch": 46.98, |
|
"eval_accuracy": 0.65865159034729, |
|
"eval_loss": 1.9061682224273682, |
|
"eval_runtime": 64.47, |
|
"eval_samples_per_second": 32.899, |
|
"eval_steps_per_second": 1.039, |
|
"step": 517 |
|
}, |
|
{ |
|
"epoch": 47.98, |
|
"eval_accuracy": 0.6643092632293701, |
|
"eval_loss": 1.8877029418945312, |
|
"eval_runtime": 63.3351, |
|
"eval_samples_per_second": 33.489, |
|
"eval_steps_per_second": 1.058, |
|
"step": 528 |
|
}, |
|
{ |
|
"epoch": 48.98, |
|
"eval_accuracy": 0.6694955229759216, |
|
"eval_loss": 1.8578468561172485, |
|
"eval_runtime": 63.6561, |
|
"eval_samples_per_second": 33.32, |
|
"eval_steps_per_second": 1.053, |
|
"step": 539 |
|
}, |
|
{ |
|
"epoch": 49.98, |
|
"eval_accuracy": 0.6690240502357483, |
|
"eval_loss": 1.8590630292892456, |
|
"eval_runtime": 62.2809, |
|
"eval_samples_per_second": 34.055, |
|
"eval_steps_per_second": 1.076, |
|
"step": 550 |
|
} |
|
], |
|
"max_steps": 550, |
|
"num_train_epochs": 50, |
|
"total_flos": 1.6031529967362595e+20, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|