whisper-small-pashto / trainer_state.json
ihanif's picture
End of training
38e26ab
raw
history blame
3.51 kB
{
"best_metric": 240.85956416464893,
"best_model_checkpoint": "./checkpoint-100",
"epoch": 57.142857142857146,
"global_step": 400,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 3.57,
"learning_rate": 2.9076923076923076e-07,
"loss": 2.8018,
"step": 25
},
{
"epoch": 7.14,
"learning_rate": 2.7153846153846153e-07,
"loss": 2.4337,
"step": 50
},
{
"epoch": 10.71,
"learning_rate": 2.523076923076923e-07,
"loss": 2.1631,
"step": 75
},
{
"epoch": 14.29,
"learning_rate": 2.3307692307692306e-07,
"loss": 1.9754,
"step": 100
},
{
"epoch": 14.29,
"eval_loss": 1.9261106252670288,
"eval_runtime": 721.539,
"eval_samples_per_second": 0.71,
"eval_steps_per_second": 0.044,
"eval_wer": 240.85956416464893,
"step": 100
},
{
"epoch": 17.86,
"learning_rate": 2.1384615384615385e-07,
"loss": 1.8067,
"step": 125
},
{
"epoch": 21.43,
"learning_rate": 1.9461538461538462e-07,
"loss": 1.7049,
"step": 150
},
{
"epoch": 25.0,
"learning_rate": 1.7538461538461539e-07,
"loss": 1.606,
"step": 175
},
{
"epoch": 28.57,
"learning_rate": 1.5615384615384615e-07,
"loss": 1.5323,
"step": 200
},
{
"epoch": 28.57,
"eval_loss": 1.5718045234680176,
"eval_runtime": 653.16,
"eval_samples_per_second": 0.784,
"eval_steps_per_second": 0.049,
"eval_wer": 168.5608353510896,
"step": 200
},
{
"epoch": 32.14,
"learning_rate": 1.3692307692307692e-07,
"loss": 1.4644,
"step": 225
},
{
"epoch": 35.71,
"learning_rate": 1.1769230769230768e-07,
"loss": 1.4134,
"step": 250
},
{
"epoch": 39.29,
"learning_rate": 9.846153846153846e-08,
"loss": 1.3706,
"step": 275
},
{
"epoch": 42.86,
"learning_rate": 7.923076923076923e-08,
"loss": 1.338,
"step": 300
},
{
"epoch": 42.86,
"eval_loss": 1.4249473810195923,
"eval_runtime": 548.9427,
"eval_samples_per_second": 0.933,
"eval_steps_per_second": 0.058,
"eval_wer": 96.64800242130751,
"step": 300
},
{
"epoch": 46.43,
"learning_rate": 6e-08,
"loss": 1.3112,
"step": 325
},
{
"epoch": 50.0,
"learning_rate": 4.076923076923077e-08,
"loss": 1.3008,
"step": 350
},
{
"epoch": 53.57,
"learning_rate": 2.1538461538461537e-08,
"loss": 1.2859,
"step": 375
},
{
"epoch": 57.14,
"learning_rate": 2.3076923076923076e-09,
"loss": 1.282,
"step": 400
},
{
"epoch": 57.14,
"eval_loss": 1.3860349655151367,
"eval_runtime": 506.783,
"eval_samples_per_second": 1.01,
"eval_steps_per_second": 0.063,
"eval_wer": 89.14951573849879,
"step": 400
},
{
"epoch": 57.14,
"step": 400,
"total_flos": 7.10814699528192e+18,
"train_loss": 1.6743954944610595,
"train_runtime": 3832.5455,
"train_samples_per_second": 6.68,
"train_steps_per_second": 0.104
}
],
"max_steps": 400,
"num_train_epochs": 58,
"total_flos": 7.10814699528192e+18,
"trial_name": null,
"trial_params": null
}