wavlm-large-english-phoneme / trainer_state.json
speech31's picture
initial_commit
d448bf4
raw
history blame
11.4 kB
{
"best_metric": 0.1746283918619156,
"best_model_checkpoint": "wavlm-english-phoneme/checkpoint-6500",
"epoch": 50.0,
"global_step": 6500,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.77,
"learning_rate": 2.97e-05,
"loss": 4.896,
"step": 100
},
{
"epoch": 1.54,
"learning_rate": 5.97e-05,
"loss": 2.5812,
"step": 200
},
{
"epoch": 2.31,
"learning_rate": 8.969999999999998e-05,
"loss": 2.4853,
"step": 300
},
{
"epoch": 3.08,
"learning_rate": 0.0001197,
"loss": 2.2031,
"step": 400
},
{
"epoch": 3.85,
"learning_rate": 0.00014969999999999998,
"loss": 1.8587,
"step": 500
},
{
"epoch": 3.85,
"eval_cer": 0.7105220883534137,
"eval_loss": 1.3614039421081543,
"eval_runtime": 21.402,
"eval_samples_per_second": 21.587,
"eval_steps_per_second": 2.71,
"step": 500
},
{
"epoch": 4.62,
"learning_rate": 0.00017969999999999998,
"loss": 1.1164,
"step": 600
},
{
"epoch": 5.38,
"learning_rate": 0.00020969999999999997,
"loss": 0.7271,
"step": 700
},
{
"epoch": 6.15,
"learning_rate": 0.0002397,
"loss": 0.5784,
"step": 800
},
{
"epoch": 6.92,
"learning_rate": 0.0002697,
"loss": 0.4487,
"step": 900
},
{
"epoch": 7.69,
"learning_rate": 0.00029969999999999997,
"loss": 0.3517,
"step": 1000
},
{
"epoch": 7.69,
"eval_cer": 0.16610441767068274,
"eval_loss": 0.3352901339530945,
"eval_runtime": 21.5161,
"eval_samples_per_second": 21.472,
"eval_steps_per_second": 2.696,
"step": 1000
},
{
"epoch": 8.46,
"learning_rate": 0.00029459999999999995,
"loss": 0.3089,
"step": 1100
},
{
"epoch": 9.23,
"learning_rate": 0.00028914545454545454,
"loss": 0.2465,
"step": 1200
},
{
"epoch": 10.0,
"learning_rate": 0.00028369090909090907,
"loss": 0.2099,
"step": 1300
},
{
"epoch": 10.77,
"learning_rate": 0.0002782363636363636,
"loss": 0.1649,
"step": 1400
},
{
"epoch": 11.54,
"learning_rate": 0.00027278181818181813,
"loss": 0.1473,
"step": 1500
},
{
"epoch": 11.54,
"eval_cer": 0.11325301204819277,
"eval_loss": 0.23726579546928406,
"eval_runtime": 34.3746,
"eval_samples_per_second": 13.44,
"eval_steps_per_second": 1.687,
"step": 1500
},
{
"epoch": 12.31,
"learning_rate": 0.0002673272727272727,
"loss": 0.1335,
"step": 1600
},
{
"epoch": 13.08,
"learning_rate": 0.00026187272727272725,
"loss": 0.118,
"step": 1700
},
{
"epoch": 13.85,
"learning_rate": 0.00025641818181818183,
"loss": 0.1083,
"step": 1800
},
{
"epoch": 14.62,
"learning_rate": 0.00025096363636363636,
"loss": 0.106,
"step": 1900
},
{
"epoch": 15.38,
"learning_rate": 0.0002455090909090909,
"loss": 0.0799,
"step": 2000
},
{
"epoch": 15.38,
"eval_cer": 0.09397590361445783,
"eval_loss": 0.20781992375850677,
"eval_runtime": 21.3113,
"eval_samples_per_second": 21.679,
"eval_steps_per_second": 2.722,
"step": 2000
},
{
"epoch": 16.15,
"learning_rate": 0.00024005454545454545,
"loss": 0.0767,
"step": 2100
},
{
"epoch": 16.92,
"learning_rate": 0.00023459999999999998,
"loss": 0.0761,
"step": 2200
},
{
"epoch": 17.69,
"learning_rate": 0.00022914545454545454,
"loss": 0.0705,
"step": 2300
},
{
"epoch": 18.46,
"learning_rate": 0.00022369090909090907,
"loss": 0.0619,
"step": 2400
},
{
"epoch": 19.23,
"learning_rate": 0.00021823636363636363,
"loss": 0.0634,
"step": 2500
},
{
"epoch": 19.23,
"eval_cer": 0.08538152610441767,
"eval_loss": 0.20878814160823822,
"eval_runtime": 20.9398,
"eval_samples_per_second": 22.063,
"eval_steps_per_second": 2.77,
"step": 2500
},
{
"epoch": 20.0,
"learning_rate": 0.00021278181818181816,
"loss": 0.0556,
"step": 2600
},
{
"epoch": 20.77,
"learning_rate": 0.00020732727272727272,
"loss": 0.0562,
"step": 2700
},
{
"epoch": 21.54,
"learning_rate": 0.00020187272727272725,
"loss": 0.0556,
"step": 2800
},
{
"epoch": 22.31,
"learning_rate": 0.0001964181818181818,
"loss": 0.0483,
"step": 2900
},
{
"epoch": 23.08,
"learning_rate": 0.00019096363636363634,
"loss": 0.0472,
"step": 3000
},
{
"epoch": 23.08,
"eval_cer": 0.0767871485943775,
"eval_loss": 0.18513090908527374,
"eval_runtime": 21.0154,
"eval_samples_per_second": 21.984,
"eval_steps_per_second": 2.76,
"step": 3000
},
{
"epoch": 23.85,
"learning_rate": 0.00018550909090909087,
"loss": 0.044,
"step": 3100
},
{
"epoch": 24.62,
"learning_rate": 0.00018005454545454543,
"loss": 0.0409,
"step": 3200
},
{
"epoch": 25.38,
"learning_rate": 0.00017459999999999996,
"loss": 0.0386,
"step": 3300
},
{
"epoch": 26.15,
"learning_rate": 0.00016914545454545452,
"loss": 0.0397,
"step": 3400
},
{
"epoch": 26.92,
"learning_rate": 0.00016369090909090905,
"loss": 0.0337,
"step": 3500
},
{
"epoch": 26.92,
"eval_cer": 0.0757429718875502,
"eval_loss": 0.2069997787475586,
"eval_runtime": 21.3619,
"eval_samples_per_second": 21.627,
"eval_steps_per_second": 2.715,
"step": 3500
},
{
"epoch": 27.69,
"learning_rate": 0.00015823636363636364,
"loss": 0.0368,
"step": 3600
},
{
"epoch": 28.46,
"learning_rate": 0.0001527818181818182,
"loss": 0.0329,
"step": 3700
},
{
"epoch": 29.23,
"learning_rate": 0.0001473272727272727,
"loss": 0.0306,
"step": 3800
},
{
"epoch": 30.0,
"learning_rate": 0.00014187272727272726,
"loss": 0.0298,
"step": 3900
},
{
"epoch": 30.77,
"learning_rate": 0.0001364181818181818,
"loss": 0.0283,
"step": 4000
},
{
"epoch": 30.77,
"eval_cer": 0.07180722891566266,
"eval_loss": 0.19239871203899384,
"eval_runtime": 34.8631,
"eval_samples_per_second": 13.252,
"eval_steps_per_second": 1.664,
"step": 4000
},
{
"epoch": 31.54,
"learning_rate": 0.00013096363636363635,
"loss": 0.0256,
"step": 4100
},
{
"epoch": 32.31,
"learning_rate": 0.0001255090909090909,
"loss": 0.0257,
"step": 4200
},
{
"epoch": 33.08,
"learning_rate": 0.00012005454545454545,
"loss": 0.0238,
"step": 4300
},
{
"epoch": 33.85,
"learning_rate": 0.0001146,
"loss": 0.0228,
"step": 4400
},
{
"epoch": 34.62,
"learning_rate": 0.00010919999999999998,
"loss": 0.0242,
"step": 4500
},
{
"epoch": 34.62,
"eval_cer": 0.0668273092369478,
"eval_loss": 0.18180887401103973,
"eval_runtime": 20.8913,
"eval_samples_per_second": 22.115,
"eval_steps_per_second": 2.776,
"step": 4500
},
{
"epoch": 35.38,
"learning_rate": 0.00010374545454545453,
"loss": 0.0209,
"step": 4600
},
{
"epoch": 36.15,
"learning_rate": 9.829090909090907e-05,
"loss": 0.0192,
"step": 4700
},
{
"epoch": 36.92,
"learning_rate": 9.283636363636363e-05,
"loss": 0.0171,
"step": 4800
},
{
"epoch": 37.69,
"learning_rate": 8.738181818181818e-05,
"loss": 0.0205,
"step": 4900
},
{
"epoch": 38.46,
"learning_rate": 8.192727272727272e-05,
"loss": 0.0187,
"step": 5000
},
{
"epoch": 38.46,
"eval_cer": 0.06730923694779116,
"eval_loss": 0.19057846069335938,
"eval_runtime": 27.3046,
"eval_samples_per_second": 16.92,
"eval_steps_per_second": 2.124,
"step": 5000
},
{
"epoch": 39.23,
"learning_rate": 7.647272727272727e-05,
"loss": 0.0159,
"step": 5100
},
{
"epoch": 40.0,
"learning_rate": 7.101818181818181e-05,
"loss": 0.0154,
"step": 5200
},
{
"epoch": 40.77,
"learning_rate": 6.556363636363636e-05,
"loss": 0.0165,
"step": 5300
},
{
"epoch": 41.54,
"learning_rate": 6.01090909090909e-05,
"loss": 0.0135,
"step": 5400
},
{
"epoch": 42.31,
"learning_rate": 5.465454545454545e-05,
"loss": 0.0156,
"step": 5500
},
{
"epoch": 42.31,
"eval_cer": 0.06409638554216868,
"eval_loss": 0.17488864064216614,
"eval_runtime": 20.9298,
"eval_samples_per_second": 22.074,
"eval_steps_per_second": 2.771,
"step": 5500
},
{
"epoch": 43.08,
"learning_rate": 4.9199999999999997e-05,
"loss": 0.0137,
"step": 5600
},
{
"epoch": 43.85,
"learning_rate": 4.374545454545454e-05,
"loss": 0.0138,
"step": 5700
},
{
"epoch": 44.62,
"learning_rate": 3.8290909090909086e-05,
"loss": 0.0117,
"step": 5800
},
{
"epoch": 45.38,
"learning_rate": 3.283636363636364e-05,
"loss": 0.0132,
"step": 5900
},
{
"epoch": 46.15,
"learning_rate": 2.738181818181818e-05,
"loss": 0.0107,
"step": 6000
},
{
"epoch": 46.15,
"eval_cer": 0.060481927710843375,
"eval_loss": 0.17818936705589294,
"eval_runtime": 20.9013,
"eval_samples_per_second": 22.104,
"eval_steps_per_second": 2.775,
"step": 6000
},
{
"epoch": 46.92,
"learning_rate": 2.1927272727272727e-05,
"loss": 0.0124,
"step": 6100
},
{
"epoch": 47.69,
"learning_rate": 1.647272727272727e-05,
"loss": 0.0119,
"step": 6200
},
{
"epoch": 48.46,
"learning_rate": 1.1018181818181816e-05,
"loss": 0.0097,
"step": 6300
},
{
"epoch": 49.23,
"learning_rate": 5.563636363636363e-06,
"loss": 0.0105,
"step": 6400
},
{
"epoch": 50.0,
"learning_rate": 1.0909090909090908e-07,
"loss": 0.0099,
"step": 6500
},
{
"epoch": 50.0,
"eval_cer": 0.06088353413654619,
"eval_loss": 0.1746283918619156,
"eval_runtime": 27.3261,
"eval_samples_per_second": 16.907,
"eval_steps_per_second": 2.123,
"step": 6500
}
],
"max_steps": 6500,
"num_train_epochs": 50,
"total_flos": 1.985767056261625e+19,
"trial_name": null,
"trial_params": null
}