{ "best_metric": 0.30745795369148254, "best_model_checkpoint": "asd_pronunciation_w2v_xlsr-reg/checkpoint-99", "epoch": 49.977777777777774, "global_step": 550, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.98, "eval_loss": 0.8269791603088379, "eval_mse": 0.8274638056755066, "eval_runtime": 67.3404, "eval_samples_per_second": 31.497, "eval_steps_per_second": 0.995, "step": 11 }, { "epoch": 1.98, "eval_loss": 0.4631172716617584, "eval_mse": 0.46300947666168213, "eval_runtime": 67.2163, "eval_samples_per_second": 31.555, "eval_steps_per_second": 0.997, "step": 22 }, { "epoch": 2.98, "eval_loss": 0.351409912109375, "eval_mse": 0.3515050709247589, "eval_runtime": 67.5563, "eval_samples_per_second": 31.396, "eval_steps_per_second": 0.992, "step": 33 }, { "epoch": 3.98, "eval_loss": 0.3585782051086426, "eval_mse": 0.35852691531181335, "eval_runtime": 69.7976, "eval_samples_per_second": 30.388, "eval_steps_per_second": 0.96, "step": 44 }, { "epoch": 4.98, "eval_loss": 0.4412296712398529, "eval_mse": 0.4412075877189636, "eval_runtime": 79.1138, "eval_samples_per_second": 26.809, "eval_steps_per_second": 0.847, "step": 55 }, { "epoch": 5.98, "eval_loss": 0.430486798286438, "eval_mse": 0.43049314618110657, "eval_runtime": 72.5547, "eval_samples_per_second": 29.233, "eval_steps_per_second": 0.923, "step": 66 }, { "epoch": 6.98, "eval_loss": 0.42916765809059143, "eval_mse": 0.4291659891605377, "eval_runtime": 95.5528, "eval_samples_per_second": 22.197, "eval_steps_per_second": 0.701, "step": 77 }, { "epoch": 7.98, "eval_loss": 0.4343053996562958, "eval_mse": 0.43428245186805725, "eval_runtime": 66.5007, "eval_samples_per_second": 31.894, "eval_steps_per_second": 1.008, "step": 88 }, { "epoch": 8.98, "eval_loss": 0.30745795369148254, "eval_mse": 0.3074318766593933, "eval_runtime": 66.2359, "eval_samples_per_second": 32.022, "eval_steps_per_second": 1.012, "step": 99 }, { "epoch": 9.98, "eval_loss": 0.42939332127571106, "eval_mse": 0.4293690323829651, "eval_runtime": 66.3865, "eval_samples_per_second": 31.949, "eval_steps_per_second": 1.009, "step": 110 }, { "epoch": 10.98, "eval_loss": 0.3727492094039917, "eval_mse": 0.3727482855319977, "eval_runtime": 66.8857, "eval_samples_per_second": 31.711, "eval_steps_per_second": 1.002, "step": 121 }, { "epoch": 11.98, "eval_loss": 0.42278197407722473, "eval_mse": 0.42277276515960693, "eval_runtime": 65.5197, "eval_samples_per_second": 32.372, "eval_steps_per_second": 1.023, "step": 132 }, { "epoch": 12.98, "eval_loss": 0.4014572203159332, "eval_mse": 0.40141549706459045, "eval_runtime": 65.6627, "eval_samples_per_second": 32.301, "eval_steps_per_second": 1.02, "step": 143 }, { "epoch": 13.98, "eval_loss": 0.37818050384521484, "eval_mse": 0.37818947434425354, "eval_runtime": 66.0031, "eval_samples_per_second": 32.135, "eval_steps_per_second": 1.015, "step": 154 }, { "epoch": 14.98, "eval_loss": 0.4358225166797638, "eval_mse": 0.43578916788101196, "eval_runtime": 65.7571, "eval_samples_per_second": 32.255, "eval_steps_per_second": 1.019, "step": 165 }, { "epoch": 15.98, "eval_loss": 0.36039263010025024, "eval_mse": 0.3603877127170563, "eval_runtime": 67.6323, "eval_samples_per_second": 31.361, "eval_steps_per_second": 0.991, "step": 176 }, { "epoch": 16.98, "eval_loss": 0.40446653962135315, "eval_mse": 0.40447959303855896, "eval_runtime": 66.1021, "eval_samples_per_second": 32.087, "eval_steps_per_second": 1.014, "step": 187 }, { "epoch": 17.98, "eval_loss": 0.3638509213924408, "eval_mse": 0.3638397455215454, "eval_runtime": 66.1765, "eval_samples_per_second": 32.051, "eval_steps_per_second": 1.012, "step": 198 }, { "epoch": 18.98, "eval_loss": 0.4001483619213104, "eval_mse": 0.400104284286499, "eval_runtime": 66.5235, "eval_samples_per_second": 31.883, "eval_steps_per_second": 1.007, "step": 209 }, { "epoch": 19.98, "eval_loss": 0.3836788535118103, "eval_mse": 0.38362112641334534, "eval_runtime": 65.5397, "eval_samples_per_second": 32.362, "eval_steps_per_second": 1.022, "step": 220 }, { "epoch": 20.98, "eval_loss": 0.3813478350639343, "eval_mse": 0.3813202679157257, "eval_runtime": 67.0847, "eval_samples_per_second": 31.617, "eval_steps_per_second": 0.999, "step": 231 }, { "epoch": 21.98, "eval_loss": 0.3911483883857727, "eval_mse": 0.39113306999206543, "eval_runtime": 66.4329, "eval_samples_per_second": 31.927, "eval_steps_per_second": 1.009, "step": 242 }, { "epoch": 22.98, "eval_loss": 0.43994417786598206, "eval_mse": 0.4399244487285614, "eval_runtime": 66.1358, "eval_samples_per_second": 32.07, "eval_steps_per_second": 1.013, "step": 253 }, { "epoch": 23.98, "eval_loss": 0.4228975772857666, "eval_mse": 0.42288002371788025, "eval_runtime": 66.6907, "eval_samples_per_second": 31.804, "eval_steps_per_second": 1.005, "step": 264 }, { "epoch": 24.98, "eval_loss": 0.4192221462726593, "eval_mse": 0.4191807508468628, "eval_runtime": 65.8241, "eval_samples_per_second": 32.222, "eval_steps_per_second": 1.018, "step": 275 }, { "epoch": 25.98, "eval_loss": 0.40975797176361084, "eval_mse": 0.4097472131252289, "eval_runtime": 67.5766, "eval_samples_per_second": 31.387, "eval_steps_per_second": 0.991, "step": 286 }, { "epoch": 26.98, "eval_loss": 0.3760901093482971, "eval_mse": 0.37607377767562866, "eval_runtime": 65.9157, "eval_samples_per_second": 32.177, "eval_steps_per_second": 1.016, "step": 297 }, { "epoch": 27.98, "eval_loss": 0.389096200466156, "eval_mse": 0.3890584111213684, "eval_runtime": 65.956, "eval_samples_per_second": 32.158, "eval_steps_per_second": 1.016, "step": 308 }, { "epoch": 28.98, "eval_loss": 0.4243176579475403, "eval_mse": 0.4242975115776062, "eval_runtime": 66.4794, "eval_samples_per_second": 31.905, "eval_steps_per_second": 1.008, "step": 319 }, { "epoch": 29.98, "eval_loss": 0.4235914349555969, "eval_mse": 0.4235744774341583, "eval_runtime": 66.2277, "eval_samples_per_second": 32.026, "eval_steps_per_second": 1.012, "step": 330 }, { "epoch": 30.98, "eval_loss": 0.4235081076622009, "eval_mse": 0.42347782850265503, "eval_runtime": 66.6381, "eval_samples_per_second": 31.829, "eval_steps_per_second": 1.005, "step": 341 }, { "epoch": 31.98, "eval_loss": 0.4236636757850647, "eval_mse": 0.4236546456813812, "eval_runtime": 65.6032, "eval_samples_per_second": 32.331, "eval_steps_per_second": 1.021, "step": 352 }, { "epoch": 32.98, "eval_loss": 0.4269878566265106, "eval_mse": 0.4269687533378601, "eval_runtime": 65.9665, "eval_samples_per_second": 32.153, "eval_steps_per_second": 1.016, "step": 363 }, { "epoch": 33.98, "eval_loss": 0.39142194390296936, "eval_mse": 0.3913804888725281, "eval_runtime": 66.6217, "eval_samples_per_second": 31.836, "eval_steps_per_second": 1.006, "step": 374 }, { "epoch": 34.98, "eval_loss": 0.3899790942668915, "eval_mse": 0.38995301723480225, "eval_runtime": 65.771, "eval_samples_per_second": 32.248, "eval_steps_per_second": 1.019, "step": 385 }, { "epoch": 35.98, "eval_loss": 0.4031297564506531, "eval_mse": 0.4031302034854889, "eval_runtime": 68.033, "eval_samples_per_second": 31.176, "eval_steps_per_second": 0.985, "step": 396 }, { "epoch": 36.98, "eval_loss": 0.373826265335083, "eval_mse": 0.3738201856613159, "eval_runtime": 66.1644, "eval_samples_per_second": 32.057, "eval_steps_per_second": 1.013, "step": 407 }, { "epoch": 37.98, "eval_loss": 0.37409740686416626, "eval_mse": 0.37407544255256653, "eval_runtime": 65.7007, "eval_samples_per_second": 32.283, "eval_steps_per_second": 1.02, "step": 418 }, { "epoch": 38.98, "eval_loss": 0.41098639369010925, "eval_mse": 0.4109634459018707, "eval_runtime": 65.8334, "eval_samples_per_second": 32.218, "eval_steps_per_second": 1.018, "step": 429 }, { "epoch": 39.98, "eval_loss": 0.38580140471458435, "eval_mse": 0.3857785165309906, "eval_runtime": 65.912, "eval_samples_per_second": 32.179, "eval_steps_per_second": 1.017, "step": 440 }, { "epoch": 40.98, "eval_loss": 0.40168315172195435, "eval_mse": 0.4016563296318054, "eval_runtime": 67.322, "eval_samples_per_second": 31.505, "eval_steps_per_second": 0.995, "step": 451 }, { "epoch": 41.98, "eval_loss": 0.3875749111175537, "eval_mse": 0.3875587284564972, "eval_runtime": 65.9445, "eval_samples_per_second": 32.163, "eval_steps_per_second": 1.016, "step": 462 }, { "epoch": 42.98, "eval_loss": 0.401607483625412, "eval_mse": 0.4015834629535675, "eval_runtime": 66.235, "eval_samples_per_second": 32.022, "eval_steps_per_second": 1.012, "step": 473 }, { "epoch": 43.98, "eval_loss": 0.3939042389392853, "eval_mse": 0.3938945233821869, "eval_runtime": 66.0054, "eval_samples_per_second": 32.134, "eval_steps_per_second": 1.015, "step": 484 }, { "epoch": 44.98, "eval_loss": 0.40803390741348267, "eval_mse": 0.40802931785583496, "eval_runtime": 66.0842, "eval_samples_per_second": 32.095, "eval_steps_per_second": 1.014, "step": 495 }, { "epoch": 45.44, "learning_rate": 3.03030303030303e-05, "loss": 0.4034, "step": 500 }, { "epoch": 45.98, "eval_loss": 0.38819119334220886, "eval_mse": 0.38818415999412537, "eval_runtime": 67.7262, "eval_samples_per_second": 31.317, "eval_steps_per_second": 0.989, "step": 506 }, { "epoch": 46.98, "eval_loss": 0.4062108099460602, "eval_mse": 0.4061962068080902, "eval_runtime": 63.6037, "eval_samples_per_second": 33.347, "eval_steps_per_second": 1.053, "step": 517 }, { "epoch": 47.98, "eval_loss": 0.38834279775619507, "eval_mse": 0.38832658529281616, "eval_runtime": 64.2256, "eval_samples_per_second": 33.024, "eval_steps_per_second": 1.043, "step": 528 }, { "epoch": 48.98, "eval_loss": 0.3969601094722748, "eval_mse": 0.3969435691833496, "eval_runtime": 63.6409, "eval_samples_per_second": 33.328, "eval_steps_per_second": 1.053, "step": 539 }, { "epoch": 49.98, "eval_loss": 0.3963707685470581, "eval_mse": 0.3963526785373688, "eval_runtime": 63.4841, "eval_samples_per_second": 33.41, "eval_steps_per_second": 1.055, "step": 550 } ], "max_steps": 550, "num_train_epochs": 50, "total_flos": 1.603121844978697e+20, "trial_name": null, "trial_params": null }