|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 15.0, |
|
"global_step": 1635, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.92, |
|
"eval_loss": 3.5559017658233643, |
|
"eval_runtime": 96.7485, |
|
"eval_samples_per_second": 17.024, |
|
"eval_steps_per_second": 2.129, |
|
"eval_wer": 1.0, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 1.83, |
|
"eval_loss": 3.0160555839538574, |
|
"eval_runtime": 94.1056, |
|
"eval_samples_per_second": 17.502, |
|
"eval_steps_per_second": 2.189, |
|
"eval_wer": 0.9998978653865795, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 2.75, |
|
"eval_loss": 0.858742356300354, |
|
"eval_runtime": 93.3532, |
|
"eval_samples_per_second": 17.643, |
|
"eval_steps_per_second": 2.207, |
|
"eval_wer": 0.7442549279950975, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 3.67, |
|
"eval_loss": 0.5855284333229065, |
|
"eval_runtime": 95.5853, |
|
"eval_samples_per_second": 17.231, |
|
"eval_steps_per_second": 2.155, |
|
"eval_wer": 0.6120927382289858, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 4.59, |
|
"learning_rate": 0.0003, |
|
"loss": 3.1095, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 4.59, |
|
"eval_loss": 0.4840559959411621, |
|
"eval_runtime": 95.1562, |
|
"eval_samples_per_second": 17.308, |
|
"eval_steps_per_second": 2.165, |
|
"eval_wer": 0.5203758553773874, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 5.5, |
|
"eval_loss": 0.453325480222702, |
|
"eval_runtime": 94.8597, |
|
"eval_samples_per_second": 17.362, |
|
"eval_steps_per_second": 2.172, |
|
"eval_wer": 0.49228883668675316, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 6.42, |
|
"eval_loss": 0.41565799713134766, |
|
"eval_runtime": 94.1725, |
|
"eval_samples_per_second": 17.489, |
|
"eval_steps_per_second": 2.187, |
|
"eval_wer": 0.43417424165049534, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 7.34, |
|
"eval_loss": 0.4304071068763733, |
|
"eval_runtime": 94.2253, |
|
"eval_samples_per_second": 17.479, |
|
"eval_steps_per_second": 2.186, |
|
"eval_wer": 0.43335716474313146, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 8.26, |
|
"eval_loss": 0.4097221791744232, |
|
"eval_runtime": 93.7406, |
|
"eval_samples_per_second": 17.57, |
|
"eval_steps_per_second": 2.198, |
|
"eval_wer": 0.4068021652538045, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 9.17, |
|
"learning_rate": 0.00016784140969162994, |
|
"loss": 0.2249, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 9.17, |
|
"eval_loss": 0.4049021899700165, |
|
"eval_runtime": 92.8281, |
|
"eval_samples_per_second": 17.742, |
|
"eval_steps_per_second": 2.219, |
|
"eval_wer": 0.38811153099785517, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 10.09, |
|
"eval_loss": 0.39933764934539795, |
|
"eval_runtime": 94.1592, |
|
"eval_samples_per_second": 17.492, |
|
"eval_steps_per_second": 2.188, |
|
"eval_wer": 0.3808599734450005, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 11.01, |
|
"eval_loss": 0.38551005721092224, |
|
"eval_runtime": 93.9927, |
|
"eval_samples_per_second": 17.523, |
|
"eval_steps_per_second": 2.192, |
|
"eval_wer": 0.37820447349606784, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 11.93, |
|
"eval_loss": 0.3923419117927551, |
|
"eval_runtime": 94.4081, |
|
"eval_samples_per_second": 17.446, |
|
"eval_steps_per_second": 2.182, |
|
"eval_wer": 0.3712593197834746, |
|
"step": 1300 |
|
}, |
|
{ |
|
"epoch": 12.84, |
|
"eval_loss": 0.3832719624042511, |
|
"eval_runtime": 93.677, |
|
"eval_samples_per_second": 17.582, |
|
"eval_steps_per_second": 2.199, |
|
"eval_wer": 0.35910530078643654, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 13.76, |
|
"learning_rate": 3.568281938325991e-05, |
|
"loss": 0.1029, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 13.76, |
|
"eval_loss": 0.3811333179473877, |
|
"eval_runtime": 93.1148, |
|
"eval_samples_per_second": 17.688, |
|
"eval_steps_per_second": 2.212, |
|
"eval_wer": 0.3569604739046063, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 14.68, |
|
"eval_loss": 0.38338083028793335, |
|
"eval_runtime": 94.0888, |
|
"eval_samples_per_second": 17.505, |
|
"eval_steps_per_second": 2.189, |
|
"eval_wer": 0.3499131855785926, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"step": 1635, |
|
"total_flos": 6.432633269893007e+18, |
|
"train_loss": 1.057601281845606, |
|
"train_runtime": 4550.4131, |
|
"train_samples_per_second": 11.465, |
|
"train_steps_per_second": 0.359 |
|
} |
|
], |
|
"max_steps": 1635, |
|
"num_train_epochs": 15, |
|
"total_flos": 6.432633269893007e+18, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|