|
{ |
|
"best_metric": 0.1746283918619156, |
|
"best_model_checkpoint": "wavlm-english-phoneme/checkpoint-6500", |
|
"epoch": 50.0, |
|
"global_step": 6500, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.77, |
|
"learning_rate": 2.97e-05, |
|
"loss": 4.896, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 1.54, |
|
"learning_rate": 5.97e-05, |
|
"loss": 2.5812, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 2.31, |
|
"learning_rate": 8.969999999999998e-05, |
|
"loss": 2.4853, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 3.08, |
|
"learning_rate": 0.0001197, |
|
"loss": 2.2031, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 3.85, |
|
"learning_rate": 0.00014969999999999998, |
|
"loss": 1.8587, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 3.85, |
|
"eval_cer": 0.7105220883534137, |
|
"eval_loss": 1.3614039421081543, |
|
"eval_runtime": 21.402, |
|
"eval_samples_per_second": 21.587, |
|
"eval_steps_per_second": 2.71, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 4.62, |
|
"learning_rate": 0.00017969999999999998, |
|
"loss": 1.1164, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 5.38, |
|
"learning_rate": 0.00020969999999999997, |
|
"loss": 0.7271, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 6.15, |
|
"learning_rate": 0.0002397, |
|
"loss": 0.5784, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 6.92, |
|
"learning_rate": 0.0002697, |
|
"loss": 0.4487, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 7.69, |
|
"learning_rate": 0.00029969999999999997, |
|
"loss": 0.3517, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 7.69, |
|
"eval_cer": 0.16610441767068274, |
|
"eval_loss": 0.3352901339530945, |
|
"eval_runtime": 21.5161, |
|
"eval_samples_per_second": 21.472, |
|
"eval_steps_per_second": 2.696, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 8.46, |
|
"learning_rate": 0.00029459999999999995, |
|
"loss": 0.3089, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 9.23, |
|
"learning_rate": 0.00028914545454545454, |
|
"loss": 0.2465, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"learning_rate": 0.00028369090909090907, |
|
"loss": 0.2099, |
|
"step": 1300 |
|
}, |
|
{ |
|
"epoch": 10.77, |
|
"learning_rate": 0.0002782363636363636, |
|
"loss": 0.1649, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 11.54, |
|
"learning_rate": 0.00027278181818181813, |
|
"loss": 0.1473, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 11.54, |
|
"eval_cer": 0.11325301204819277, |
|
"eval_loss": 0.23726579546928406, |
|
"eval_runtime": 34.3746, |
|
"eval_samples_per_second": 13.44, |
|
"eval_steps_per_second": 1.687, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 12.31, |
|
"learning_rate": 0.0002673272727272727, |
|
"loss": 0.1335, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 13.08, |
|
"learning_rate": 0.00026187272727272725, |
|
"loss": 0.118, |
|
"step": 1700 |
|
}, |
|
{ |
|
"epoch": 13.85, |
|
"learning_rate": 0.00025641818181818183, |
|
"loss": 0.1083, |
|
"step": 1800 |
|
}, |
|
{ |
|
"epoch": 14.62, |
|
"learning_rate": 0.00025096363636363636, |
|
"loss": 0.106, |
|
"step": 1900 |
|
}, |
|
{ |
|
"epoch": 15.38, |
|
"learning_rate": 0.0002455090909090909, |
|
"loss": 0.0799, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 15.38, |
|
"eval_cer": 0.09397590361445783, |
|
"eval_loss": 0.20781992375850677, |
|
"eval_runtime": 21.3113, |
|
"eval_samples_per_second": 21.679, |
|
"eval_steps_per_second": 2.722, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 16.15, |
|
"learning_rate": 0.00024005454545454545, |
|
"loss": 0.0767, |
|
"step": 2100 |
|
}, |
|
{ |
|
"epoch": 16.92, |
|
"learning_rate": 0.00023459999999999998, |
|
"loss": 0.0761, |
|
"step": 2200 |
|
}, |
|
{ |
|
"epoch": 17.69, |
|
"learning_rate": 0.00022914545454545454, |
|
"loss": 0.0705, |
|
"step": 2300 |
|
}, |
|
{ |
|
"epoch": 18.46, |
|
"learning_rate": 0.00022369090909090907, |
|
"loss": 0.0619, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 19.23, |
|
"learning_rate": 0.00021823636363636363, |
|
"loss": 0.0634, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 19.23, |
|
"eval_cer": 0.08538152610441767, |
|
"eval_loss": 0.20878814160823822, |
|
"eval_runtime": 20.9398, |
|
"eval_samples_per_second": 22.063, |
|
"eval_steps_per_second": 2.77, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"learning_rate": 0.00021278181818181816, |
|
"loss": 0.0556, |
|
"step": 2600 |
|
}, |
|
{ |
|
"epoch": 20.77, |
|
"learning_rate": 0.00020732727272727272, |
|
"loss": 0.0562, |
|
"step": 2700 |
|
}, |
|
{ |
|
"epoch": 21.54, |
|
"learning_rate": 0.00020187272727272725, |
|
"loss": 0.0556, |
|
"step": 2800 |
|
}, |
|
{ |
|
"epoch": 22.31, |
|
"learning_rate": 0.0001964181818181818, |
|
"loss": 0.0483, |
|
"step": 2900 |
|
}, |
|
{ |
|
"epoch": 23.08, |
|
"learning_rate": 0.00019096363636363634, |
|
"loss": 0.0472, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 23.08, |
|
"eval_cer": 0.0767871485943775, |
|
"eval_loss": 0.18513090908527374, |
|
"eval_runtime": 21.0154, |
|
"eval_samples_per_second": 21.984, |
|
"eval_steps_per_second": 2.76, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 23.85, |
|
"learning_rate": 0.00018550909090909087, |
|
"loss": 0.044, |
|
"step": 3100 |
|
}, |
|
{ |
|
"epoch": 24.62, |
|
"learning_rate": 0.00018005454545454543, |
|
"loss": 0.0409, |
|
"step": 3200 |
|
}, |
|
{ |
|
"epoch": 25.38, |
|
"learning_rate": 0.00017459999999999996, |
|
"loss": 0.0386, |
|
"step": 3300 |
|
}, |
|
{ |
|
"epoch": 26.15, |
|
"learning_rate": 0.00016914545454545452, |
|
"loss": 0.0397, |
|
"step": 3400 |
|
}, |
|
{ |
|
"epoch": 26.92, |
|
"learning_rate": 0.00016369090909090905, |
|
"loss": 0.0337, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 26.92, |
|
"eval_cer": 0.0757429718875502, |
|
"eval_loss": 0.2069997787475586, |
|
"eval_runtime": 21.3619, |
|
"eval_samples_per_second": 21.627, |
|
"eval_steps_per_second": 2.715, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 27.69, |
|
"learning_rate": 0.00015823636363636364, |
|
"loss": 0.0368, |
|
"step": 3600 |
|
}, |
|
{ |
|
"epoch": 28.46, |
|
"learning_rate": 0.0001527818181818182, |
|
"loss": 0.0329, |
|
"step": 3700 |
|
}, |
|
{ |
|
"epoch": 29.23, |
|
"learning_rate": 0.0001473272727272727, |
|
"loss": 0.0306, |
|
"step": 3800 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"learning_rate": 0.00014187272727272726, |
|
"loss": 0.0298, |
|
"step": 3900 |
|
}, |
|
{ |
|
"epoch": 30.77, |
|
"learning_rate": 0.0001364181818181818, |
|
"loss": 0.0283, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 30.77, |
|
"eval_cer": 0.07180722891566266, |
|
"eval_loss": 0.19239871203899384, |
|
"eval_runtime": 34.8631, |
|
"eval_samples_per_second": 13.252, |
|
"eval_steps_per_second": 1.664, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 31.54, |
|
"learning_rate": 0.00013096363636363635, |
|
"loss": 0.0256, |
|
"step": 4100 |
|
}, |
|
{ |
|
"epoch": 32.31, |
|
"learning_rate": 0.0001255090909090909, |
|
"loss": 0.0257, |
|
"step": 4200 |
|
}, |
|
{ |
|
"epoch": 33.08, |
|
"learning_rate": 0.00012005454545454545, |
|
"loss": 0.0238, |
|
"step": 4300 |
|
}, |
|
{ |
|
"epoch": 33.85, |
|
"learning_rate": 0.0001146, |
|
"loss": 0.0228, |
|
"step": 4400 |
|
}, |
|
{ |
|
"epoch": 34.62, |
|
"learning_rate": 0.00010919999999999998, |
|
"loss": 0.0242, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 34.62, |
|
"eval_cer": 0.0668273092369478, |
|
"eval_loss": 0.18180887401103973, |
|
"eval_runtime": 20.8913, |
|
"eval_samples_per_second": 22.115, |
|
"eval_steps_per_second": 2.776, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 35.38, |
|
"learning_rate": 0.00010374545454545453, |
|
"loss": 0.0209, |
|
"step": 4600 |
|
}, |
|
{ |
|
"epoch": 36.15, |
|
"learning_rate": 9.829090909090907e-05, |
|
"loss": 0.0192, |
|
"step": 4700 |
|
}, |
|
{ |
|
"epoch": 36.92, |
|
"learning_rate": 9.283636363636363e-05, |
|
"loss": 0.0171, |
|
"step": 4800 |
|
}, |
|
{ |
|
"epoch": 37.69, |
|
"learning_rate": 8.738181818181818e-05, |
|
"loss": 0.0205, |
|
"step": 4900 |
|
}, |
|
{ |
|
"epoch": 38.46, |
|
"learning_rate": 8.192727272727272e-05, |
|
"loss": 0.0187, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 38.46, |
|
"eval_cer": 0.06730923694779116, |
|
"eval_loss": 0.19057846069335938, |
|
"eval_runtime": 27.3046, |
|
"eval_samples_per_second": 16.92, |
|
"eval_steps_per_second": 2.124, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 39.23, |
|
"learning_rate": 7.647272727272727e-05, |
|
"loss": 0.0159, |
|
"step": 5100 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"learning_rate": 7.101818181818181e-05, |
|
"loss": 0.0154, |
|
"step": 5200 |
|
}, |
|
{ |
|
"epoch": 40.77, |
|
"learning_rate": 6.556363636363636e-05, |
|
"loss": 0.0165, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 41.54, |
|
"learning_rate": 6.01090909090909e-05, |
|
"loss": 0.0135, |
|
"step": 5400 |
|
}, |
|
{ |
|
"epoch": 42.31, |
|
"learning_rate": 5.465454545454545e-05, |
|
"loss": 0.0156, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 42.31, |
|
"eval_cer": 0.06409638554216868, |
|
"eval_loss": 0.17488864064216614, |
|
"eval_runtime": 20.9298, |
|
"eval_samples_per_second": 22.074, |
|
"eval_steps_per_second": 2.771, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 43.08, |
|
"learning_rate": 4.9199999999999997e-05, |
|
"loss": 0.0137, |
|
"step": 5600 |
|
}, |
|
{ |
|
"epoch": 43.85, |
|
"learning_rate": 4.374545454545454e-05, |
|
"loss": 0.0138, |
|
"step": 5700 |
|
}, |
|
{ |
|
"epoch": 44.62, |
|
"learning_rate": 3.8290909090909086e-05, |
|
"loss": 0.0117, |
|
"step": 5800 |
|
}, |
|
{ |
|
"epoch": 45.38, |
|
"learning_rate": 3.283636363636364e-05, |
|
"loss": 0.0132, |
|
"step": 5900 |
|
}, |
|
{ |
|
"epoch": 46.15, |
|
"learning_rate": 2.738181818181818e-05, |
|
"loss": 0.0107, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 46.15, |
|
"eval_cer": 0.060481927710843375, |
|
"eval_loss": 0.17818936705589294, |
|
"eval_runtime": 20.9013, |
|
"eval_samples_per_second": 22.104, |
|
"eval_steps_per_second": 2.775, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 46.92, |
|
"learning_rate": 2.1927272727272727e-05, |
|
"loss": 0.0124, |
|
"step": 6100 |
|
}, |
|
{ |
|
"epoch": 47.69, |
|
"learning_rate": 1.647272727272727e-05, |
|
"loss": 0.0119, |
|
"step": 6200 |
|
}, |
|
{ |
|
"epoch": 48.46, |
|
"learning_rate": 1.1018181818181816e-05, |
|
"loss": 0.0097, |
|
"step": 6300 |
|
}, |
|
{ |
|
"epoch": 49.23, |
|
"learning_rate": 5.563636363636363e-06, |
|
"loss": 0.0105, |
|
"step": 6400 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"learning_rate": 1.0909090909090908e-07, |
|
"loss": 0.0099, |
|
"step": 6500 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"eval_cer": 0.06088353413654619, |
|
"eval_loss": 0.1746283918619156, |
|
"eval_runtime": 27.3261, |
|
"eval_samples_per_second": 16.907, |
|
"eval_steps_per_second": 2.123, |
|
"step": 6500 |
|
} |
|
], |
|
"max_steps": 6500, |
|
"num_train_epochs": 50, |
|
"total_flos": 1.985767056261625e+19, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|