diff --git "a/trainer_state.json" "b/trainer_state.json" new file mode 100644--- /dev/null +++ "b/trainer_state.json" @@ -0,0 +1,29416 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 12.416802151999763, + "global_step": 84000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.01, + "learning_rate": 8.000000000000001e-07, + "loss": 4.2133, + "step": 40 + }, + { + "epoch": 0.01, + "eval_loss": 8.511882781982422, + "eval_runtime": 507.7122, + "eval_samples_per_second": 15.046, + "eval_wer": 0.6384687955630521, + "step": 40 + }, + { + "epoch": 0.01, + "learning_rate": 1.6000000000000001e-06, + "loss": 4.0439, + "step": 80 + }, + { + "epoch": 0.01, + "eval_loss": 8.176779747009277, + "eval_runtime": 509.0639, + "eval_samples_per_second": 15.006, + "eval_wer": 0.6322364847479917, + "step": 80 + }, + { + "epoch": 0.02, + "learning_rate": 2.4000000000000003e-06, + "loss": 3.9154, + "step": 120 + }, + { + "epoch": 0.02, + "eval_loss": 7.60866117477417, + "eval_runtime": 506.3517, + "eval_samples_per_second": 15.086, + "eval_wer": 0.6243460361931444, + "step": 120 + }, + { + "epoch": 0.02, + "learning_rate": 3.2000000000000003e-06, + "loss": 3.5183, + "step": 160 + }, + { + "epoch": 0.02, + "eval_loss": 6.876076698303223, + "eval_runtime": 505.7631, + "eval_samples_per_second": 15.104, + "eval_wer": 0.6111381114382916, + "step": 160 + }, + { + "epoch": 0.03, + "learning_rate": 4.000000000000001e-06, + "loss": 3.011, + "step": 200 + }, + { + "epoch": 0.03, + "eval_loss": 6.000689506530762, + "eval_runtime": 505.8319, + "eval_samples_per_second": 15.102, + "eval_wer": 0.5992166728608593, + "step": 200 + }, + { + "epoch": 0.04, + "learning_rate": 4.800000000000001e-06, + "loss": 2.5676, + "step": 240 + }, + { + "epoch": 0.04, + "eval_loss": 5.190187454223633, + "eval_runtime": 506.3407, + "eval_samples_per_second": 15.087, + "eval_wer": 0.5866948740672975, + "step": 240 + }, + { + "epoch": 0.04, + "learning_rate": 5.600000000000001e-06, + "loss": 2.2081, + "step": 280 + }, + { + "epoch": 0.04, + "eval_loss": 4.561764717102051, + "eval_runtime": 505.8441, + "eval_samples_per_second": 15.101, + "eval_wer": 0.5730295320049172, + "step": 280 + }, + { + "epoch": 0.05, + "learning_rate": 6.4000000000000006e-06, + "loss": 2.2183, + "step": 320 + }, + { + "epoch": 0.05, + "eval_loss": 4.161630630493164, + "eval_runtime": 506.1047, + "eval_samples_per_second": 15.094, + "eval_wer": 0.5625375225135081, + "step": 320 + }, + { + "epoch": 0.05, + "learning_rate": 7.2000000000000005e-06, + "loss": 2.001, + "step": 360 + }, + { + "epoch": 0.05, + "eval_loss": 3.9902665615081787, + "eval_runtime": 506.5931, + "eval_samples_per_second": 15.079, + "eval_wer": 0.5569913376597387, + "step": 360 + }, + { + "epoch": 0.06, + "learning_rate": 8.000000000000001e-06, + "loss": 1.9999, + "step": 400 + }, + { + "epoch": 0.06, + "eval_loss": 3.8676645755767822, + "eval_runtime": 506.5386, + "eval_samples_per_second": 15.081, + "eval_wer": 0.5517882157866149, + "step": 400 + }, + { + "epoch": 0.07, + "learning_rate": 8.8e-06, + "loss": 1.9991, + "step": 440 + }, + { + "epoch": 0.07, + "eval_loss": 3.6282665729522705, + "eval_runtime": 505.8386, + "eval_samples_per_second": 15.102, + "eval_wer": 0.5469853340575774, + "step": 440 + }, + { + "epoch": 0.07, + "learning_rate": 9.600000000000001e-06, + "loss": 2.1213, + "step": 480 + }, + { + "epoch": 0.07, + "eval_loss": 3.351651668548584, + "eval_runtime": 507.7122, + "eval_samples_per_second": 15.046, + "eval_wer": 0.5398096000457417, + "step": 480 + }, + { + "epoch": 0.08, + "learning_rate": 9.998516320474778e-06, + "loss": 1.9415, + "step": 520 + }, + { + "epoch": 0.08, + "eval_loss": 3.307413101196289, + "eval_runtime": 507.2404, + "eval_samples_per_second": 15.06, + "eval_wer": 0.5381800508876755, + "step": 520 + }, + { + "epoch": 0.08, + "learning_rate": 9.995548961424332e-06, + "loss": 1.93, + "step": 560 + }, + { + "epoch": 0.08, + "eval_loss": 3.112159252166748, + "eval_runtime": 507.2473, + "eval_samples_per_second": 15.06, + "eval_wer": 0.5326624546156266, + "step": 560 + }, + { + "epoch": 0.09, + "learning_rate": 9.992581602373887e-06, + "loss": 1.7952, + "step": 600 + }, + { + "epoch": 0.09, + "eval_loss": 3.1151227951049805, + "eval_runtime": 507.1713, + "eval_samples_per_second": 15.062, + "eval_wer": 0.5310614940392807, + "step": 600 + }, + { + "epoch": 0.09, + "learning_rate": 9.989614243323443e-06, + "loss": 1.8172, + "step": 640 + }, + { + "epoch": 0.09, + "eval_loss": 3.1644179821014404, + "eval_runtime": 508.7332, + "eval_samples_per_second": 15.016, + "eval_wer": 0.5308041968037965, + "step": 640 + }, + { + "epoch": 0.1, + "learning_rate": 9.986646884272998e-06, + "loss": 1.8188, + "step": 680 + }, + { + "epoch": 0.1, + "eval_loss": 2.9733777046203613, + "eval_runtime": 507.9635, + "eval_samples_per_second": 15.038, + "eval_wer": 0.5263443780554047, + "step": 680 + }, + { + "epoch": 0.11, + "learning_rate": 9.983679525222552e-06, + "loss": 1.8733, + "step": 720 + }, + { + "epoch": 0.11, + "eval_loss": 2.8506317138671875, + "eval_runtime": 508.1594, + "eval_samples_per_second": 15.033, + "eval_wer": 0.5224849195231425, + "step": 720 + }, + { + "epoch": 0.11, + "learning_rate": 9.980712166172108e-06, + "loss": 1.7325, + "step": 760 + }, + { + "epoch": 0.11, + "eval_loss": 2.8051726818084717, + "eval_runtime": 506.05, + "eval_samples_per_second": 15.095, + "eval_wer": 0.5203121873123875, + "step": 760 + }, + { + "epoch": 0.12, + "learning_rate": 9.977744807121663e-06, + "loss": 1.8116, + "step": 800 + }, + { + "epoch": 0.12, + "eval_loss": 2.6554903984069824, + "eval_runtime": 509.1916, + "eval_samples_per_second": 15.002, + "eval_wer": 0.5155950713285113, + "step": 800 + }, + { + "epoch": 0.12, + "learning_rate": 9.974777448071219e-06, + "loss": 1.7828, + "step": 840 + }, + { + "epoch": 0.12, + "eval_loss": 2.707118272781372, + "eval_runtime": 510.6821, + "eval_samples_per_second": 14.958, + "eval_wer": 0.5172817976500186, + "step": 840 + }, + { + "epoch": 0.13, + "learning_rate": 9.971810089020773e-06, + "loss": 1.793, + "step": 880 + }, + { + "epoch": 0.13, + "eval_loss": 2.607694149017334, + "eval_runtime": 507.9749, + "eval_samples_per_second": 15.038, + "eval_wer": 0.5136796363532405, + "step": 880 + }, + { + "epoch": 0.14, + "learning_rate": 9.968842729970328e-06, + "loss": 1.6913, + "step": 920 + }, + { + "epoch": 0.14, + "eval_loss": 2.5908613204956055, + "eval_runtime": 508.1547, + "eval_samples_per_second": 15.033, + "eval_wer": 0.5129363332285085, + "step": 920 + }, + { + "epoch": 0.14, + "learning_rate": 9.965875370919882e-06, + "loss": 1.6796, + "step": 960 + }, + { + "epoch": 0.14, + "eval_loss": 2.558162212371826, + "eval_runtime": 509.237, + "eval_samples_per_second": 15.001, + "eval_wer": 0.5112781954887218, + "step": 960 + }, + { + "epoch": 0.15, + "learning_rate": 9.962908011869436e-06, + "loss": 1.7553, + "step": 1000 + }, + { + "epoch": 0.15, + "eval_loss": 2.461369037628174, + "eval_runtime": 506.9589, + "eval_samples_per_second": 15.068, + "eval_wer": 0.5085908688069984, + "step": 1000 + }, + { + "epoch": 0.15, + "learning_rate": 9.959940652818993e-06, + "loss": 1.6965, + "step": 1040 + }, + { + "epoch": 0.15, + "eval_loss": 2.449120044708252, + "eval_runtime": 508.9931, + "eval_samples_per_second": 15.008, + "eval_wer": 0.5074759141199006, + "step": 1040 + }, + { + "epoch": 0.16, + "learning_rate": 9.956973293768547e-06, + "loss": 1.6172, + "step": 1080 + }, + { + "epoch": 0.16, + "eval_loss": 2.4614946842193604, + "eval_runtime": 508.8115, + "eval_samples_per_second": 15.013, + "eval_wer": 0.5074759141199006, + "step": 1080 + }, + { + "epoch": 0.17, + "learning_rate": 9.954005934718101e-06, + "loss": 1.6918, + "step": 1120 + }, + { + "epoch": 0.17, + "eval_loss": 2.363593578338623, + "eval_runtime": 509.119, + "eval_samples_per_second": 15.004, + "eval_wer": 0.5030160953715086, + "step": 1120 + }, + { + "epoch": 0.17, + "learning_rate": 9.951038575667656e-06, + "loss": 1.7333, + "step": 1160 + }, + { + "epoch": 0.17, + "eval_loss": 2.273185968399048, + "eval_runtime": 508.3618, + "eval_samples_per_second": 15.027, + "eval_wer": 0.49941393407473056, + "step": 1160 + }, + { + "epoch": 0.18, + "learning_rate": 9.94807121661721e-06, + "loss": 1.6648, + "step": 1200 + }, + { + "epoch": 0.18, + "eval_loss": 2.290827989578247, + "eval_runtime": 508.8109, + "eval_samples_per_second": 15.013, + "eval_wer": 0.4985848652048372, + "step": 1200 + }, + { + "epoch": 0.18, + "learning_rate": 9.945103857566766e-06, + "loss": 1.6576, + "step": 1240 + }, + { + "epoch": 0.18, + "eval_loss": 2.26701283454895, + "eval_runtime": 509.3143, + "eval_samples_per_second": 14.999, + "eval_wer": 0.49718402470053463, + "step": 1240 + }, + { + "epoch": 0.19, + "learning_rate": 9.942136498516321e-06, + "loss": 1.68, + "step": 1280 + }, + { + "epoch": 0.19, + "eval_loss": 2.2503156661987305, + "eval_runtime": 508.9511, + "eval_samples_per_second": 15.009, + "eval_wer": 0.49489693816289776, + "step": 1280 + }, + { + "epoch": 0.2, + "learning_rate": 9.939169139465877e-06, + "loss": 1.5679, + "step": 1320 + }, + { + "epoch": 0.2, + "eval_loss": 2.266763210296631, + "eval_runtime": 509.3455, + "eval_samples_per_second": 14.998, + "eval_wer": 0.49486834958117726, + "step": 1320 + }, + { + "epoch": 0.2, + "learning_rate": 9.936201780415431e-06, + "loss": 1.5697, + "step": 1360 + }, + { + "epoch": 0.2, + "eval_loss": 2.2245819568634033, + "eval_runtime": 510.0642, + "eval_samples_per_second": 14.977, + "eval_wer": 0.49326738900483147, + "step": 1360 + }, + { + "epoch": 0.21, + "learning_rate": 9.933234421364986e-06, + "loss": 1.6732, + "step": 1400 + }, + { + "epoch": 0.21, + "eval_loss": 2.180576801300049, + "eval_runtime": 509.3452, + "eval_samples_per_second": 14.998, + "eval_wer": 0.4915806626833243, + "step": 1400 + }, + { + "epoch": 0.21, + "learning_rate": 9.930267062314542e-06, + "loss": 1.5137, + "step": 1440 + }, + { + "epoch": 0.21, + "eval_loss": 2.2087972164154053, + "eval_runtime": 510.3773, + "eval_samples_per_second": 14.967, + "eval_wer": 0.492867148860745, + "step": 1440 + }, + { + "epoch": 0.22, + "learning_rate": 9.927299703264097e-06, + "loss": 1.5327, + "step": 1480 + }, + { + "epoch": 0.22, + "eval_loss": 2.1999690532684326, + "eval_runtime": 510.0032, + "eval_samples_per_second": 14.978, + "eval_wer": 0.49172360559192657, + "step": 1480 + }, + { + "epoch": 0.22, + "learning_rate": 9.924332344213651e-06, + "loss": 1.6258, + "step": 1520 + }, + { + "epoch": 0.22, + "eval_loss": 2.13869047164917, + "eval_runtime": 513.3934, + "eval_samples_per_second": 14.879, + "eval_wer": 0.48923639898224647, + "step": 1520 + }, + { + "epoch": 0.23, + "learning_rate": 9.921364985163205e-06, + "loss": 1.6906, + "step": 1560 + }, + { + "epoch": 0.23, + "eval_loss": 2.1670727729797363, + "eval_runtime": 508.7612, + "eval_samples_per_second": 15.015, + "eval_wer": 0.4893793418908488, + "step": 1560 + }, + { + "epoch": 0.24, + "learning_rate": 9.91839762611276e-06, + "loss": 1.5288, + "step": 1600 + }, + { + "epoch": 0.24, + "eval_loss": 2.1631860733032227, + "eval_runtime": 511.7308, + "eval_samples_per_second": 14.928, + "eval_wer": 0.48915063323708513, + "step": 1600 + }, + { + "epoch": 0.24, + "learning_rate": 9.915430267062314e-06, + "loss": 1.5986, + "step": 1640 + }, + { + "epoch": 0.24, + "eval_loss": 2.103747844696045, + "eval_runtime": 514.6938, + "eval_samples_per_second": 14.842, + "eval_wer": 0.4867206037908459, + "step": 1640 + }, + { + "epoch": 0.25, + "learning_rate": 9.91246290801187e-06, + "loss": 1.5171, + "step": 1680 + }, + { + "epoch": 0.25, + "eval_loss": 2.10674786567688, + "eval_runtime": 509.0977, + "eval_samples_per_second": 15.005, + "eval_wer": 0.4861774207381572, + "step": 1680 + }, + { + "epoch": 0.25, + "learning_rate": 9.909495548961425e-06, + "loss": 1.7026, + "step": 1720 + }, + { + "epoch": 0.25, + "eval_loss": 2.0203464031219482, + "eval_runtime": 510.2686, + "eval_samples_per_second": 14.971, + "eval_wer": 0.48391892278224075, + "step": 1720 + }, + { + "epoch": 0.26, + "learning_rate": 9.90652818991098e-06, + "loss": 1.6435, + "step": 1760 + }, + { + "epoch": 0.26, + "eval_loss": 2.00274920463562, + "eval_runtime": 512.9086, + "eval_samples_per_second": 14.893, + "eval_wer": 0.48357585980159523, + "step": 1760 + }, + { + "epoch": 0.27, + "learning_rate": 9.903560830860535e-06, + "loss": 1.627, + "step": 1800 + }, + { + "epoch": 0.27, + "eval_loss": 2.012718915939331, + "eval_runtime": 510.036, + "eval_samples_per_second": 14.977, + "eval_wer": 0.4840618656908431, + "step": 1800 + }, + { + "epoch": 0.27, + "learning_rate": 9.90059347181009e-06, + "loss": 1.6283, + "step": 1840 + }, + { + "epoch": 0.27, + "eval_loss": 1.9829087257385254, + "eval_runtime": 510.6865, + "eval_samples_per_second": 14.958, + "eval_wer": 0.4816890134080448, + "step": 1840 + }, + { + "epoch": 0.28, + "learning_rate": 9.897626112759644e-06, + "loss": 1.6398, + "step": 1880 + }, + { + "epoch": 0.28, + "eval_loss": 2.0142433643341064, + "eval_runtime": 510.7641, + "eval_samples_per_second": 14.956, + "eval_wer": 0.48377597987363846, + "step": 1880 + }, + { + "epoch": 0.28, + "learning_rate": 9.8946587537092e-06, + "loss": 1.4638, + "step": 1920 + }, + { + "epoch": 0.28, + "eval_loss": 2.0483970642089844, + "eval_runtime": 510.6351, + "eval_samples_per_second": 14.96, + "eval_wer": 0.4842619857628863, + "step": 1920 + }, + { + "epoch": 0.29, + "learning_rate": 9.891691394658755e-06, + "loss": 1.5916, + "step": 1960 + }, + { + "epoch": 0.29, + "eval_loss": 1.926328182220459, + "eval_runtime": 510.8635, + "eval_samples_per_second": 14.953, + "eval_wer": 0.47934474970696705, + "step": 1960 + }, + { + "epoch": 0.3, + "learning_rate": 9.88872403560831e-06, + "loss": 1.5755, + "step": 2000 + }, + { + "epoch": 0.3, + "eval_loss": 1.8705726861953735, + "eval_runtime": 510.9855, + "eval_samples_per_second": 14.95, + "eval_wer": 0.4770576631693302, + "step": 2000 + }, + { + "epoch": 0.3, + "learning_rate": 9.885756676557864e-06, + "loss": 1.497, + "step": 2040 + }, + { + "epoch": 0.3, + "eval_loss": 1.9062929153442383, + "eval_runtime": 510.421, + "eval_samples_per_second": 14.966, + "eval_wer": 0.4775722576402985, + "step": 2040 + }, + { + "epoch": 0.31, + "learning_rate": 9.88278931750742e-06, + "loss": 1.4912, + "step": 2080 + }, + { + "epoch": 0.31, + "eval_loss": 1.8141084909439087, + "eval_runtime": 510.423, + "eval_samples_per_second": 14.966, + "eval_wer": 0.4730552617284656, + "step": 2080 + }, + { + "epoch": 0.31, + "learning_rate": 9.879821958456974e-06, + "loss": 1.5281, + "step": 2120 + }, + { + "epoch": 0.31, + "eval_loss": 1.89003324508667, + "eval_runtime": 509.8664, + "eval_samples_per_second": 14.982, + "eval_wer": 0.4777437891306212, + "step": 2120 + }, + { + "epoch": 0.32, + "learning_rate": 9.876854599406529e-06, + "loss": 1.6475, + "step": 2160 + }, + { + "epoch": 0.32, + "eval_loss": 1.8485099077224731, + "eval_runtime": 510.3708, + "eval_samples_per_second": 14.968, + "eval_wer": 0.4757139998284685, + "step": 2160 + }, + { + "epoch": 0.33, + "learning_rate": 9.873887240356083e-06, + "loss": 1.5952, + "step": 2200 + }, + { + "epoch": 0.33, + "eval_loss": 1.8507680892944336, + "eval_runtime": 510.5091, + "eval_samples_per_second": 14.963, + "eval_wer": 0.47557105691986623, + "step": 2200 + }, + { + "epoch": 0.33, + "learning_rate": 9.870919881305638e-06, + "loss": 1.5251, + "step": 2240 + }, + { + "epoch": 0.33, + "eval_loss": 1.8981126546859741, + "eval_runtime": 514.4598, + "eval_samples_per_second": 14.849, + "eval_wer": 0.4780868521112668, + "step": 2240 + }, + { + "epoch": 0.34, + "learning_rate": 9.867952522255194e-06, + "loss": 1.533, + "step": 2280 + }, + { + "epoch": 0.34, + "eval_loss": 1.8121381998062134, + "eval_runtime": 510.3935, + "eval_samples_per_second": 14.967, + "eval_wer": 0.47376997627147716, + "step": 2280 + }, + { + "epoch": 0.34, + "learning_rate": 9.864985163204748e-06, + "loss": 1.4825, + "step": 2320 + }, + { + "epoch": 0.34, + "eval_loss": 1.8304731845855713, + "eval_runtime": 510.5128, + "eval_samples_per_second": 14.963, + "eval_wer": 0.4722261928585723, + "step": 2320 + }, + { + "epoch": 0.35, + "learning_rate": 9.862017804154303e-06, + "loss": 1.5538, + "step": 2360 + }, + { + "epoch": 0.35, + "eval_loss": 1.8135722875595093, + "eval_runtime": 513.8497, + "eval_samples_per_second": 14.866, + "eval_wer": 0.4716830098058835, + "step": 2360 + }, + { + "epoch": 0.35, + "learning_rate": 9.859050445103859e-06, + "loss": 1.5597, + "step": 2400 + }, + { + "epoch": 0.35, + "eval_loss": 1.7757524251937866, + "eval_runtime": 511.0956, + "eval_samples_per_second": 14.946, + "eval_wer": 0.46968180908545126, + "step": 2400 + }, + { + "epoch": 0.36, + "learning_rate": 9.856083086053413e-06, + "loss": 1.5297, + "step": 2440 + }, + { + "epoch": 0.36, + "eval_loss": 1.828170895576477, + "eval_runtime": 510.8652, + "eval_samples_per_second": 14.953, + "eval_wer": 0.47342691329083164, + "step": 2440 + }, + { + "epoch": 0.37, + "learning_rate": 9.85311572700297e-06, + "loss": 1.5557, + "step": 2480 + }, + { + "epoch": 0.37, + "eval_loss": 1.8002945184707642, + "eval_runtime": 511.4369, + "eval_samples_per_second": 14.936, + "eval_wer": 0.47268361016609967, + "step": 2480 + }, + { + "epoch": 0.37, + "learning_rate": 9.850148367952524e-06, + "loss": 1.5349, + "step": 2520 + }, + { + "epoch": 0.37, + "eval_loss": 1.73868727684021, + "eval_runtime": 511.4155, + "eval_samples_per_second": 14.937, + "eval_wer": 0.46753766545641673, + "step": 2520 + }, + { + "epoch": 0.38, + "learning_rate": 9.847181008902078e-06, + "loss": 1.4815, + "step": 2560 + }, + { + "epoch": 0.38, + "eval_loss": 1.7303557395935059, + "eval_runtime": 511.8251, + "eval_samples_per_second": 14.925, + "eval_wer": 0.46779496269190085, + "step": 2560 + }, + { + "epoch": 0.38, + "learning_rate": 9.844213649851633e-06, + "loss": 1.5265, + "step": 2600 + }, + { + "epoch": 0.38, + "eval_loss": 1.675964117050171, + "eval_runtime": 511.9187, + "eval_samples_per_second": 14.922, + "eval_wer": 0.4655650533177049, + "step": 2600 + }, + { + "epoch": 0.39, + "learning_rate": 9.841246290801187e-06, + "loss": 1.5675, + "step": 2640 + }, + { + "epoch": 0.39, + "eval_loss": 1.6297857761383057, + "eval_runtime": 512.5309, + "eval_samples_per_second": 14.904, + "eval_wer": 0.4627919608908202, + "step": 2640 + }, + { + "epoch": 0.4, + "learning_rate": 9.838278931750742e-06, + "loss": 1.4947, + "step": 2680 + }, + { + "epoch": 0.4, + "eval_loss": 1.6822654008865356, + "eval_runtime": 511.6877, + "eval_samples_per_second": 14.929, + "eval_wer": 0.464392921467166, + "step": 2680 + }, + { + "epoch": 0.4, + "learning_rate": 9.835311572700298e-06, + "loss": 1.493, + "step": 2720 + }, + { + "epoch": 0.4, + "eval_loss": 1.754394769668579, + "eval_runtime": 511.3075, + "eval_samples_per_second": 14.94, + "eval_wer": 0.46868120872523517, + "step": 2720 + }, + { + "epoch": 0.41, + "learning_rate": 9.832344213649852e-06, + "loss": 1.5664, + "step": 2760 + }, + { + "epoch": 0.41, + "eval_loss": 1.6030182838439941, + "eval_runtime": 513.0607, + "eval_samples_per_second": 14.889, + "eval_wer": 0.4596472169015695, + "step": 2760 + }, + { + "epoch": 0.41, + "learning_rate": 9.829376854599407e-06, + "loss": 1.5427, + "step": 2800 + }, + { + "epoch": 0.41, + "eval_loss": 1.7321422100067139, + "eval_runtime": 511.9465, + "eval_samples_per_second": 14.921, + "eval_wer": 0.4665942422596415, + "step": 2800 + }, + { + "epoch": 0.42, + "learning_rate": 9.826409495548963e-06, + "loss": 1.4226, + "step": 2840 + }, + { + "epoch": 0.42, + "eval_loss": 1.6753013134002686, + "eval_runtime": 511.8285, + "eval_samples_per_second": 14.925, + "eval_wer": 0.46284913805426114, + "step": 2840 + }, + { + "epoch": 0.43, + "learning_rate": 9.823442136498517e-06, + "loss": 1.3667, + "step": 2880 + }, + { + "epoch": 0.43, + "eval_loss": 1.69732666015625, + "eval_runtime": 512.7551, + "eval_samples_per_second": 14.898, + "eval_wer": 0.4631350238714657, + "step": 2880 + }, + { + "epoch": 0.43, + "learning_rate": 9.820474777448072e-06, + "loss": 1.4723, + "step": 2920 + }, + { + "epoch": 0.43, + "eval_loss": 1.6817669868469238, + "eval_runtime": 512.1768, + "eval_samples_per_second": 14.915, + "eval_wer": 0.46121958889619485, + "step": 2920 + }, + { + "epoch": 0.44, + "learning_rate": 9.817507418397628e-06, + "loss": 1.5479, + "step": 2960 + }, + { + "epoch": 0.44, + "eval_loss": 1.6193170547485352, + "eval_runtime": 511.9305, + "eval_samples_per_second": 14.922, + "eval_wer": 0.45824637639726695, + "step": 2960 + }, + { + "epoch": 0.44, + "learning_rate": 9.814540059347182e-06, + "loss": 1.4255, + "step": 3000 + }, + { + "epoch": 0.44, + "eval_loss": 1.6400399208068848, + "eval_runtime": 511.1765, + "eval_samples_per_second": 14.944, + "eval_wer": 0.4589610909402784, + "step": 3000 + }, + { + "epoch": 0.45, + "learning_rate": 9.811572700296737e-06, + "loss": 1.4461, + "step": 3040 + }, + { + "epoch": 0.45, + "eval_loss": 1.6966502666473389, + "eval_runtime": 512.4424, + "eval_samples_per_second": 14.907, + "eval_wer": 0.46061922868006516, + "step": 3040 + }, + { + "epoch": 0.46, + "learning_rate": 9.808605341246291e-06, + "loss": 1.498, + "step": 3080 + }, + { + "epoch": 0.46, + "eval_loss": 1.62920343875885, + "eval_runtime": 512.351, + "eval_samples_per_second": 14.91, + "eval_wer": 0.4585322622144715, + "step": 3080 + }, + { + "epoch": 0.46, + "learning_rate": 9.805637982195847e-06, + "loss": 1.4714, + "step": 3120 + }, + { + "epoch": 0.46, + "eval_loss": 1.560744047164917, + "eval_runtime": 512.4371, + "eval_samples_per_second": 14.907, + "eval_wer": 0.4551873981531776, + "step": 3120 + }, + { + "epoch": 0.47, + "learning_rate": 9.802670623145402e-06, + "loss": 1.4213, + "step": 3160 + }, + { + "epoch": 0.47, + "eval_loss": 1.6912263631820679, + "eval_runtime": 512.5177, + "eval_samples_per_second": 14.905, + "eval_wer": 0.4617913605306041, + "step": 3160 + }, + { + "epoch": 0.47, + "learning_rate": 9.799703264094956e-06, + "loss": 1.531, + "step": 3200 + }, + { + "epoch": 0.47, + "eval_loss": 1.5711145401000977, + "eval_runtime": 512.78, + "eval_samples_per_second": 14.897, + "eval_wer": 0.4538151462305955, + "step": 3200 + }, + { + "epoch": 0.48, + "learning_rate": 9.79673590504451e-06, + "loss": 1.4855, + "step": 3240 + }, + { + "epoch": 0.48, + "eval_loss": 1.596936821937561, + "eval_runtime": 513.6738, + "eval_samples_per_second": 14.871, + "eval_wer": 0.45524457531661855, + "step": 3240 + }, + { + "epoch": 0.48, + "learning_rate": 9.793768545994065e-06, + "loss": 1.5223, + "step": 3280 + }, + { + "epoch": 0.48, + "eval_loss": 1.6045000553131104, + "eval_runtime": 513.5544, + "eval_samples_per_second": 14.875, + "eval_wer": 0.45618799851339376, + "step": 3280 + }, + { + "epoch": 0.49, + "learning_rate": 9.790801186943621e-06, + "loss": 1.4955, + "step": 3320 + }, + { + "epoch": 0.49, + "eval_loss": 1.5930547714233398, + "eval_runtime": 513.492, + "eval_samples_per_second": 14.877, + "eval_wer": 0.45421538637468195, + "step": 3320 + }, + { + "epoch": 0.5, + "learning_rate": 9.787833827893176e-06, + "loss": 1.4155, + "step": 3360 + }, + { + "epoch": 0.5, + "eval_loss": 1.6870766878128052, + "eval_runtime": 512.2954, + "eval_samples_per_second": 14.911, + "eval_wer": 0.4597329826467309, + "step": 3360 + }, + { + "epoch": 0.5, + "learning_rate": 9.78486646884273e-06, + "loss": 1.4564, + "step": 3400 + }, + { + "epoch": 0.5, + "eval_loss": 1.6465580463409424, + "eval_runtime": 513.0267, + "eval_samples_per_second": 14.89, + "eval_wer": 0.4583607307241488, + "step": 3400 + }, + { + "epoch": 0.51, + "learning_rate": 9.781899109792286e-06, + "loss": 1.519, + "step": 3440 + }, + { + "epoch": 0.51, + "eval_loss": 1.5829496383666992, + "eval_runtime": 512.8231, + "eval_samples_per_second": 14.896, + "eval_wer": 0.45438691786500474, + "step": 3440 + }, + { + "epoch": 0.51, + "learning_rate": 9.77893175074184e-06, + "loss": 1.4322, + "step": 3480 + }, + { + "epoch": 0.51, + "eval_loss": 1.5679658651351929, + "eval_runtime": 513.2794, + "eval_samples_per_second": 14.883, + "eval_wer": 0.4531576088510249, + "step": 3480 + }, + { + "epoch": 0.52, + "learning_rate": 9.775964391691397e-06, + "loss": 1.5055, + "step": 3520 + }, + { + "epoch": 0.52, + "eval_loss": 1.5032811164855957, + "eval_runtime": 512.7639, + "eval_samples_per_second": 14.898, + "eval_wer": 0.44975556762629004, + "step": 3520 + }, + { + "epoch": 0.53, + "learning_rate": 9.772997032640951e-06, + "loss": 1.4672, + "step": 3560 + }, + { + "epoch": 0.53, + "eval_loss": 1.573556661605835, + "eval_runtime": 513.0365, + "eval_samples_per_second": 14.89, + "eval_wer": 0.4522999513994111, + "step": 3560 + }, + { + "epoch": 0.53, + "learning_rate": 9.770029673590506e-06, + "loss": 1.4754, + "step": 3600 + }, + { + "epoch": 0.53, + "eval_loss": 1.6171257495880127, + "eval_runtime": 513.3264, + "eval_samples_per_second": 14.881, + "eval_wer": 0.45515880957145716, + "step": 3600 + }, + { + "epoch": 0.54, + "learning_rate": 9.76706231454006e-06, + "loss": 1.4826, + "step": 3640 + }, + { + "epoch": 0.54, + "eval_loss": 1.506168007850647, + "eval_runtime": 512.9716, + "eval_samples_per_second": 14.892, + "eval_wer": 0.4494982703908059, + "step": 3640 + }, + { + "epoch": 0.54, + "learning_rate": 9.764094955489615e-06, + "loss": 1.3979, + "step": 3680 + }, + { + "epoch": 0.54, + "eval_loss": 1.6118969917297363, + "eval_runtime": 514.4538, + "eval_samples_per_second": 14.849, + "eval_wer": 0.4547013922639298, + "step": 3680 + }, + { + "epoch": 0.55, + "learning_rate": 9.761127596439169e-06, + "loss": 1.5158, + "step": 3720 + }, + { + "epoch": 0.55, + "eval_loss": 1.5075455904006958, + "eval_runtime": 513.7055, + "eval_samples_per_second": 14.87, + "eval_wer": 0.449069441664999, + "step": 3720 + }, + { + "epoch": 0.56, + "learning_rate": 9.758160237388725e-06, + "loss": 1.5191, + "step": 3760 + }, + { + "epoch": 0.56, + "eval_loss": 1.5338021516799927, + "eval_runtime": 513.4855, + "eval_samples_per_second": 14.877, + "eval_wer": 0.45069899082306525, + "step": 3760 + }, + { + "epoch": 0.56, + "learning_rate": 9.75519287833828e-06, + "loss": 1.3889, + "step": 3800 + }, + { + "epoch": 0.56, + "eval_loss": 1.5285530090332031, + "eval_runtime": 512.5198, + "eval_samples_per_second": 14.905, + "eval_wer": 0.4493553274822036, + "step": 3800 + }, + { + "epoch": 0.57, + "learning_rate": 9.752225519287834e-06, + "loss": 1.4135, + "step": 3840 + }, + { + "epoch": 0.57, + "eval_loss": 1.5430896282196045, + "eval_runtime": 514.1839, + "eval_samples_per_second": 14.857, + "eval_wer": 0.4491266188284399, + "step": 3840 + }, + { + "epoch": 0.57, + "learning_rate": 9.749258160237388e-06, + "loss": 1.3764, + "step": 3880 + }, + { + "epoch": 0.57, + "eval_loss": 1.5497621297836304, + "eval_runtime": 513.3649, + "eval_samples_per_second": 14.88, + "eval_wer": 0.449069441664999, + "step": 3880 + }, + { + "epoch": 0.58, + "learning_rate": 9.746290801186945e-06, + "loss": 1.4534, + "step": 3920 + }, + { + "epoch": 0.58, + "eval_loss": 1.540468692779541, + "eval_runtime": 515.1682, + "eval_samples_per_second": 14.828, + "eval_wer": 0.4481831956316647, + "step": 3920 + }, + { + "epoch": 0.59, + "learning_rate": 9.743323442136499e-06, + "loss": 1.4373, + "step": 3960 + }, + { + "epoch": 0.59, + "eval_loss": 1.5205267667770386, + "eval_runtime": 512.5519, + "eval_samples_per_second": 14.904, + "eval_wer": 0.44626776065639384, + "step": 3960 + }, + { + "epoch": 0.59, + "learning_rate": 9.740356083086055e-06, + "loss": 1.455, + "step": 4000 + }, + { + "epoch": 0.59, + "eval_loss": 1.4752908945083618, + "eval_runtime": 513.9628, + "eval_samples_per_second": 14.863, + "eval_wer": 0.4435232568112296, + "step": 4000 + }, + { + "epoch": 0.6, + "learning_rate": 9.73738872403561e-06, + "loss": 1.521, + "step": 4040 + }, + { + "epoch": 0.6, + "eval_loss": 1.4031436443328857, + "eval_runtime": 512.9768, + "eval_samples_per_second": 14.892, + "eval_wer": 0.4400640384230538, + "step": 4040 + }, + { + "epoch": 0.6, + "learning_rate": 9.734421364985164e-06, + "loss": 1.4567, + "step": 4080 + }, + { + "epoch": 0.6, + "eval_loss": 1.422682762145996, + "eval_runtime": 514.1822, + "eval_samples_per_second": 14.857, + "eval_wer": 0.4416364104176792, + "step": 4080 + }, + { + "epoch": 0.61, + "learning_rate": 9.731454005934718e-06, + "loss": 1.539, + "step": 4120 + }, + { + "epoch": 0.61, + "eval_loss": 1.465431571006775, + "eval_runtime": 514.4797, + "eval_samples_per_second": 14.848, + "eval_wer": 0.444352325681123, + "step": 4120 + }, + { + "epoch": 0.61, + "learning_rate": 9.728486646884275e-06, + "loss": 1.4136, + "step": 4160 + }, + { + "epoch": 0.61, + "eval_loss": 1.4815162420272827, + "eval_runtime": 513.5145, + "eval_samples_per_second": 14.876, + "eval_wer": 0.4444095028445639, + "step": 4160 + }, + { + "epoch": 0.62, + "learning_rate": 9.725519287833829e-06, + "loss": 1.4708, + "step": 4200 + }, + { + "epoch": 0.62, + "eval_loss": 1.474371314048767, + "eval_runtime": 516.7645, + "eval_samples_per_second": 14.782, + "eval_wer": 0.4438091426284342, + "step": 4200 + }, + { + "epoch": 0.63, + "learning_rate": 9.722551928783383e-06, + "loss": 1.3458, + "step": 4240 + }, + { + "epoch": 0.63, + "eval_loss": 1.5466420650482178, + "eval_runtime": 514.6222, + "eval_samples_per_second": 14.844, + "eval_wer": 0.44746848108865317, + "step": 4240 + }, + { + "epoch": 0.63, + "learning_rate": 9.719584569732938e-06, + "loss": 1.3715, + "step": 4280 + }, + { + "epoch": 0.63, + "eval_loss": 1.463120937347412, + "eval_runtime": 513.3837, + "eval_samples_per_second": 14.88, + "eval_wer": 0.442865719431659, + "step": 4280 + }, + { + "epoch": 0.64, + "learning_rate": 9.716617210682492e-06, + "loss": 1.4154, + "step": 4320 + }, + { + "epoch": 0.64, + "eval_loss": 1.486952543258667, + "eval_runtime": 513.3815, + "eval_samples_per_second": 14.88, + "eval_wer": 0.4452099831327368, + "step": 4320 + }, + { + "epoch": 0.64, + "learning_rate": 9.713649851632049e-06, + "loss": 1.3751, + "step": 4360 + }, + { + "epoch": 0.64, + "eval_loss": 1.4923511743545532, + "eval_runtime": 515.3881, + "eval_samples_per_second": 14.822, + "eval_wer": 0.4452957488778982, + "step": 4360 + }, + { + "epoch": 0.65, + "learning_rate": 9.710682492581603e-06, + "loss": 1.4758, + "step": 4400 + }, + { + "epoch": 0.65, + "eval_loss": 1.4749441146850586, + "eval_runtime": 514.9061, + "eval_samples_per_second": 14.836, + "eval_wer": 0.44455244575316616, + "step": 4400 + }, + { + "epoch": 0.66, + "learning_rate": 9.707715133531157e-06, + "loss": 1.4697, + "step": 4440 + }, + { + "epoch": 0.66, + "eval_loss": 1.3999656438827515, + "eval_runtime": 514.1094, + "eval_samples_per_second": 14.859, + "eval_wer": 0.4402355699133766, + "step": 4440 + }, + { + "epoch": 0.66, + "learning_rate": 9.704747774480714e-06, + "loss": 1.4336, + "step": 4480 + }, + { + "epoch": 0.66, + "eval_loss": 1.443965196609497, + "eval_runtime": 513.638, + "eval_samples_per_second": 14.872, + "eval_wer": 0.44123617027359274, + "step": 4480 + }, + { + "epoch": 0.67, + "learning_rate": 9.701780415430268e-06, + "loss": 1.371, + "step": 4520 + }, + { + "epoch": 0.67, + "eval_loss": 1.4547443389892578, + "eval_runtime": 515.6026, + "eval_samples_per_second": 14.816, + "eval_wer": 0.44115040452843135, + "step": 4520 + }, + { + "epoch": 0.67, + "learning_rate": 9.698813056379824e-06, + "loss": 1.4866, + "step": 4560 + }, + { + "epoch": 0.67, + "eval_loss": 1.3573508262634277, + "eval_runtime": 514.1535, + "eval_samples_per_second": 14.857, + "eval_wer": 0.4361474027273507, + "step": 4560 + }, + { + "epoch": 0.68, + "learning_rate": 9.695845697329379e-06, + "loss": 1.3148, + "step": 4600 + }, + { + "epoch": 0.68, + "eval_loss": 1.4772440195083618, + "eval_runtime": 514.9078, + "eval_samples_per_second": 14.836, + "eval_wer": 0.44223677063380884, + "step": 4600 + }, + { + "epoch": 0.69, + "learning_rate": 9.692878338278933e-06, + "loss": 1.4019, + "step": 4640 + }, + { + "epoch": 0.69, + "eval_loss": 1.4322845935821533, + "eval_runtime": 516.1706, + "eval_samples_per_second": 14.799, + "eval_wer": 0.4382915463563853, + "step": 4640 + }, + { + "epoch": 0.69, + "learning_rate": 9.689910979228487e-06, + "loss": 1.3301, + "step": 4680 + }, + { + "epoch": 0.69, + "eval_loss": 1.469238042831421, + "eval_runtime": 514.6099, + "eval_samples_per_second": 14.844, + "eval_wer": 0.4401783927499357, + "step": 4680 + }, + { + "epoch": 0.7, + "learning_rate": 9.686943620178042e-06, + "loss": 1.3722, + "step": 4720 + }, + { + "epoch": 0.7, + "eval_loss": 1.4200299978256226, + "eval_runtime": 514.4814, + "eval_samples_per_second": 14.848, + "eval_wer": 0.4367477629434804, + "step": 4720 + }, + { + "epoch": 0.7, + "learning_rate": 9.683976261127596e-06, + "loss": 1.5306, + "step": 4760 + }, + { + "epoch": 0.7, + "eval_loss": 1.4061706066131592, + "eval_runtime": 515.7464, + "eval_samples_per_second": 14.812, + "eval_wer": 0.4358901054918666, + "step": 4760 + }, + { + "epoch": 0.71, + "learning_rate": 9.681008902077152e-06, + "loss": 1.4243, + "step": 4800 + }, + { + "epoch": 0.71, + "eval_loss": 1.4921140670776367, + "eval_runtime": 516.7076, + "eval_samples_per_second": 14.784, + "eval_wer": 0.441379113182195, + "step": 4800 + }, + { + "epoch": 0.72, + "learning_rate": 9.678041543026707e-06, + "loss": 1.3804, + "step": 4840 + }, + { + "epoch": 0.72, + "eval_loss": 1.4785774946212769, + "eval_runtime": 514.972, + "eval_samples_per_second": 14.834, + "eval_wer": 0.4409216958746677, + "step": 4840 + }, + { + "epoch": 0.72, + "learning_rate": 9.675074183976261e-06, + "loss": 1.3578, + "step": 4880 + }, + { + "epoch": 0.72, + "eval_loss": 1.4605354070663452, + "eval_runtime": 515.3858, + "eval_samples_per_second": 14.822, + "eval_wer": 0.4383487235198262, + "step": 4880 + }, + { + "epoch": 0.73, + "learning_rate": 9.672106824925816e-06, + "loss": 1.5268, + "step": 4920 + }, + { + "epoch": 0.73, + "eval_loss": 1.3747655153274536, + "eval_runtime": 517.8275, + "eval_samples_per_second": 14.752, + "eval_wer": 0.4333171331370251, + "step": 4920 + }, + { + "epoch": 0.73, + "learning_rate": 9.669139465875372e-06, + "loss": 1.3945, + "step": 4960 + }, + { + "epoch": 0.73, + "eval_loss": 1.4661548137664795, + "eval_runtime": 516.6681, + "eval_samples_per_second": 14.785, + "eval_wer": 0.4394065010434832, + "step": 4960 + }, + { + "epoch": 0.74, + "learning_rate": 9.666172106824926e-06, + "loss": 1.3763, + "step": 5000 + }, + { + "epoch": 0.74, + "eval_loss": 1.4231951236724854, + "eval_runtime": 519.2986, + "eval_samples_per_second": 14.71, + "eval_wer": 0.4353469224391778, + "step": 5000 + }, + { + "epoch": 0.74, + "learning_rate": 9.663204747774482e-06, + "loss": 1.418, + "step": 5040 + }, + { + "epoch": 0.74, + "eval_loss": 1.3683183193206787, + "eval_runtime": 515.8341, + "eval_samples_per_second": 14.809, + "eval_wer": 0.4320592355413248, + "step": 5040 + }, + { + "epoch": 0.75, + "learning_rate": 9.660237388724037e-06, + "loss": 1.3425, + "step": 5080 + }, + { + "epoch": 0.75, + "eval_loss": 1.4367696046829224, + "eval_runtime": 514.9922, + "eval_samples_per_second": 14.833, + "eval_wer": 0.4359758712370279, + "step": 5080 + }, + { + "epoch": 0.76, + "learning_rate": 9.657270029673591e-06, + "loss": 1.3999, + "step": 5120 + }, + { + "epoch": 0.76, + "eval_loss": 1.4469764232635498, + "eval_runtime": 516.3669, + "eval_samples_per_second": 14.794, + "eval_wer": 0.4372623574144487, + "step": 5120 + }, + { + "epoch": 0.76, + "learning_rate": 9.654302670623146e-06, + "loss": 1.3089, + "step": 5160 + }, + { + "epoch": 0.76, + "eval_loss": 1.4533969163894653, + "eval_runtime": 516.115, + "eval_samples_per_second": 14.801, + "eval_wer": 0.4364046999628348, + "step": 5160 + }, + { + "epoch": 0.77, + "learning_rate": 9.651335311572702e-06, + "loss": 1.3404, + "step": 5200 + }, + { + "epoch": 0.77, + "eval_loss": 1.421602487564087, + "eval_runtime": 516.128, + "eval_samples_per_second": 14.801, + "eval_wer": 0.43368878469939104, + "step": 5200 + }, + { + "epoch": 0.77, + "learning_rate": 9.648367952522256e-06, + "loss": 1.4258, + "step": 5240 + }, + { + "epoch": 0.77, + "eval_loss": 1.3950155973434448, + "eval_runtime": 519.7331, + "eval_samples_per_second": 14.698, + "eval_wer": 0.4323165327768089, + "step": 5240 + }, + { + "epoch": 0.78, + "learning_rate": 9.64540059347181e-06, + "loss": 1.3655, + "step": 5280 + }, + { + "epoch": 0.78, + "eval_loss": 1.425440788269043, + "eval_runtime": 515.6073, + "eval_samples_per_second": 14.816, + "eval_wer": 0.43471797364132764, + "step": 5280 + }, + { + "epoch": 0.79, + "learning_rate": 9.642433234421365e-06, + "loss": 1.4751, + "step": 5320 + }, + { + "epoch": 0.79, + "eval_loss": 1.3840967416763306, + "eval_runtime": 516.6867, + "eval_samples_per_second": 14.785, + "eval_wer": 0.4313445209983133, + "step": 5320 + }, + { + "epoch": 0.79, + "learning_rate": 9.63946587537092e-06, + "loss": 1.4119, + "step": 5360 + }, + { + "epoch": 0.79, + "eval_loss": 1.3902742862701416, + "eval_runtime": 516.1815, + "eval_samples_per_second": 14.799, + "eval_wer": 0.43148746390691556, + "step": 5360 + }, + { + "epoch": 0.8, + "learning_rate": 9.636498516320476e-06, + "loss": 1.4392, + "step": 5400 + }, + { + "epoch": 0.8, + "eval_loss": 1.4150809049606323, + "eval_runtime": 516.3127, + "eval_samples_per_second": 14.795, + "eval_wer": 0.4343463220789617, + "step": 5400 + }, + { + "epoch": 0.8, + "learning_rate": 9.63353115727003e-06, + "loss": 1.4046, + "step": 5440 + }, + { + "epoch": 0.8, + "eval_loss": 1.3621487617492676, + "eval_runtime": 517.564, + "eval_samples_per_second": 14.76, + "eval_wer": 0.4298579147488493, + "step": 5440 + }, + { + "epoch": 0.81, + "learning_rate": 9.630563798219585e-06, + "loss": 1.3454, + "step": 5480 + }, + { + "epoch": 0.81, + "eval_loss": 1.4361683130264282, + "eval_runtime": 515.6033, + "eval_samples_per_second": 14.816, + "eval_wer": 0.43609022556390975, + "step": 5480 + }, + { + "epoch": 0.82, + "learning_rate": 9.627596439169141e-06, + "loss": 1.4559, + "step": 5520 + }, + { + "epoch": 0.82, + "eval_loss": 1.3505635261535645, + "eval_runtime": 516.6128, + "eval_samples_per_second": 14.787, + "eval_wer": 0.4301723891477744, + "step": 5520 + }, + { + "epoch": 0.82, + "learning_rate": 9.624629080118695e-06, + "loss": 1.4474, + "step": 5560 + }, + { + "epoch": 0.82, + "eval_loss": 1.2954375743865967, + "eval_runtime": 516.5953, + "eval_samples_per_second": 14.787, + "eval_wer": 0.42542668458217786, + "step": 5560 + }, + { + "epoch": 0.83, + "learning_rate": 9.62166172106825e-06, + "loss": 1.4003, + "step": 5600 + }, + { + "epoch": 0.83, + "eval_loss": 1.3330990076065063, + "eval_runtime": 515.8012, + "eval_samples_per_second": 14.81, + "eval_wer": 0.4281997770090626, + "step": 5600 + }, + { + "epoch": 0.83, + "learning_rate": 9.618694362017806e-06, + "loss": 1.3783, + "step": 5640 + }, + { + "epoch": 0.83, + "eval_loss": 1.3351558446884155, + "eval_runtime": 514.9496, + "eval_samples_per_second": 14.834, + "eval_wer": 0.4280568341004603, + "step": 5640 + }, + { + "epoch": 0.84, + "learning_rate": 9.61572700296736e-06, + "loss": 1.2803, + "step": 5680 + }, + { + "epoch": 0.84, + "eval_loss": 1.4254976511001587, + "eval_runtime": 516.2286, + "eval_samples_per_second": 14.798, + "eval_wer": 0.43500385945853226, + "step": 5680 + }, + { + "epoch": 0.85, + "learning_rate": 9.612759643916915e-06, + "loss": 1.3915, + "step": 5720 + }, + { + "epoch": 0.85, + "eval_loss": 1.351941704750061, + "eval_runtime": 516.9013, + "eval_samples_per_second": 14.778, + "eval_wer": 0.4287715486434718, + "step": 5720 + }, + { + "epoch": 0.85, + "learning_rate": 9.60979228486647e-06, + "loss": 1.3142, + "step": 5760 + }, + { + "epoch": 0.85, + "eval_loss": 1.4030635356903076, + "eval_runtime": 515.3754, + "eval_samples_per_second": 14.822, + "eval_wer": 0.43097286943594726, + "step": 5760 + }, + { + "epoch": 0.86, + "learning_rate": 9.606824925816024e-06, + "loss": 1.3912, + "step": 5800 + }, + { + "epoch": 0.86, + "eval_loss": 1.3692469596862793, + "eval_runtime": 517.234, + "eval_samples_per_second": 14.769, + "eval_wer": 0.4290002572972355, + "step": 5800 + }, + { + "epoch": 0.86, + "learning_rate": 9.60385756676558e-06, + "loss": 1.3827, + "step": 5840 + }, + { + "epoch": 0.86, + "eval_loss": 1.354949712753296, + "eval_runtime": 515.804, + "eval_samples_per_second": 14.81, + "eval_wer": 0.42705623374024415, + "step": 5840 + }, + { + "epoch": 0.87, + "learning_rate": 9.600890207715134e-06, + "loss": 1.3959, + "step": 5880 + }, + { + "epoch": 0.87, + "eval_loss": 1.4425711631774902, + "eval_runtime": 514.9528, + "eval_samples_per_second": 14.834, + "eval_wer": 0.434117613425198, + "step": 5880 + }, + { + "epoch": 0.87, + "learning_rate": 9.597922848664689e-06, + "loss": 1.3335, + "step": 5920 + }, + { + "epoch": 0.87, + "eval_loss": 1.3389842510223389, + "eval_runtime": 515.6002, + "eval_samples_per_second": 14.816, + "eval_wer": 0.42628434203379173, + "step": 5920 + }, + { + "epoch": 0.88, + "learning_rate": 9.594955489614243e-06, + "loss": 1.3211, + "step": 5960 + }, + { + "epoch": 0.88, + "eval_loss": 1.4448662996292114, + "eval_runtime": 517.1767, + "eval_samples_per_second": 14.771, + "eval_wer": 0.43285971582949767, + "step": 5960 + }, + { + "epoch": 0.89, + "learning_rate": 9.5919881305638e-06, + "loss": 1.339, + "step": 6000 + }, + { + "epoch": 0.89, + "eval_loss": 1.3400218486785889, + "eval_runtime": 516.8274, + "eval_samples_per_second": 14.781, + "eval_wer": 0.4251122101832528, + "step": 6000 + }, + { + "epoch": 0.89, + "learning_rate": 9.589020771513354e-06, + "loss": 1.372, + "step": 6040 + }, + { + "epoch": 0.89, + "eval_loss": 1.3646411895751953, + "eval_runtime": 515.8442, + "eval_samples_per_second": 14.809, + "eval_wer": 0.4270276451585237, + "step": 6040 + }, + { + "epoch": 0.9, + "learning_rate": 9.586053412462908e-06, + "loss": 1.3864, + "step": 6080 + }, + { + "epoch": 0.9, + "eval_loss": 1.357338547706604, + "eval_runtime": 516.0993, + "eval_samples_per_second": 14.801, + "eval_wer": 0.42654163926927585, + "step": 6080 + }, + { + "epoch": 0.9, + "learning_rate": 9.583086053412464e-06, + "loss": 1.3097, + "step": 6120 + }, + { + "epoch": 0.9, + "eval_loss": 1.4197887182235718, + "eval_runtime": 515.7773, + "eval_samples_per_second": 14.811, + "eval_wer": 0.42960061751336515, + "step": 6120 + }, + { + "epoch": 0.91, + "learning_rate": 9.580118694362019e-06, + "loss": 1.3551, + "step": 6160 + }, + { + "epoch": 0.91, + "eval_loss": 1.4010227918624878, + "eval_runtime": 516.7255, + "eval_samples_per_second": 14.783, + "eval_wer": 0.427542239629492, + "step": 6160 + }, + { + "epoch": 0.92, + "learning_rate": 9.577151335311573e-06, + "loss": 1.2897, + "step": 6200 + }, + { + "epoch": 0.92, + "eval_loss": 1.4033058881759644, + "eval_runtime": 516.6256, + "eval_samples_per_second": 14.786, + "eval_wer": 0.4273421195574488, + "step": 6200 + }, + { + "epoch": 0.92, + "learning_rate": 9.57418397626113e-06, + "loss": 1.3949, + "step": 6240 + }, + { + "epoch": 0.92, + "eval_loss": 1.3815839290618896, + "eval_runtime": 516.1636, + "eval_samples_per_second": 14.8, + "eval_wer": 0.4258269247262643, + "step": 6240 + }, + { + "epoch": 0.93, + "learning_rate": 9.571216617210684e-06, + "loss": 1.4411, + "step": 6280 + }, + { + "epoch": 0.93, + "eval_loss": 1.317184567451477, + "eval_runtime": 516.4932, + "eval_samples_per_second": 14.79, + "eval_wer": 0.4220532319391635, + "step": 6280 + }, + { + "epoch": 0.93, + "learning_rate": 9.568249258160238e-06, + "loss": 1.3632, + "step": 6320 + }, + { + "epoch": 0.93, + "eval_loss": 1.409461498260498, + "eval_runtime": 516.0299, + "eval_samples_per_second": 14.803, + "eval_wer": 0.42662740501443724, + "step": 6320 + }, + { + "epoch": 0.94, + "learning_rate": 9.565281899109793e-06, + "loss": 1.4314, + "step": 6360 + }, + { + "epoch": 0.94, + "eval_loss": 1.3631606101989746, + "eval_runtime": 515.6547, + "eval_samples_per_second": 14.814, + "eval_wer": 0.42448326138540265, + "step": 6360 + }, + { + "epoch": 0.95, + "learning_rate": 9.562314540059347e-06, + "loss": 1.3763, + "step": 6400 + }, + { + "epoch": 0.95, + "eval_loss": 1.3963958024978638, + "eval_runtime": 515.7604, + "eval_samples_per_second": 14.811, + "eval_wer": 0.4268275250864805, + "step": 6400 + }, + { + "epoch": 0.95, + "learning_rate": 9.559347181008903e-06, + "loss": 1.4094, + "step": 6440 + }, + { + "epoch": 0.95, + "eval_loss": 1.3508167266845703, + "eval_runtime": 517.1098, + "eval_samples_per_second": 14.772, + "eval_wer": 0.42448326138540265, + "step": 6440 + }, + { + "epoch": 0.96, + "learning_rate": 9.556379821958458e-06, + "loss": 1.4234, + "step": 6480 + }, + { + "epoch": 0.96, + "eval_loss": 1.3754290342330933, + "eval_runtime": 516.7121, + "eval_samples_per_second": 14.784, + "eval_wer": 0.42668458217787814, + "step": 6480 + }, + { + "epoch": 0.96, + "learning_rate": 9.553412462908012e-06, + "loss": 1.3401, + "step": 6520 + }, + { + "epoch": 0.96, + "eval_loss": 1.33858323097229, + "eval_runtime": 516.484, + "eval_samples_per_second": 14.79, + "eval_wer": 0.423511249606907, + "step": 6520 + }, + { + "epoch": 0.97, + "learning_rate": 9.550445103857568e-06, + "loss": 1.3512, + "step": 6560 + }, + { + "epoch": 0.97, + "eval_loss": 1.3395580053329468, + "eval_runtime": 516.7199, + "eval_samples_per_second": 14.784, + "eval_wer": 0.4231681866262615, + "step": 6560 + }, + { + "epoch": 0.98, + "learning_rate": 9.547477744807123e-06, + "loss": 1.399, + "step": 6600 + }, + { + "epoch": 0.98, + "eval_loss": 1.3298590183258057, + "eval_runtime": 516.172, + "eval_samples_per_second": 14.799, + "eval_wer": 0.42202464335744305, + "step": 6600 + }, + { + "epoch": 0.98, + "learning_rate": 9.544510385756677e-06, + "loss": 1.3191, + "step": 6640 + }, + { + "epoch": 0.98, + "eval_loss": 1.3099309206008911, + "eval_runtime": 516.2612, + "eval_samples_per_second": 14.797, + "eval_wer": 0.4207667457617428, + "step": 6640 + }, + { + "epoch": 0.99, + "learning_rate": 9.541543026706233e-06, + "loss": 1.3806, + "step": 6680 + }, + { + "epoch": 0.99, + "eval_loss": 1.3367770910263062, + "eval_runtime": 517.6382, + "eval_samples_per_second": 14.757, + "eval_wer": 0.4223391177563681, + "step": 6680 + }, + { + "epoch": 0.99, + "learning_rate": 9.538575667655788e-06, + "loss": 1.3752, + "step": 6720 + }, + { + "epoch": 0.99, + "eval_loss": 1.3307867050170898, + "eval_runtime": 517.9335, + "eval_samples_per_second": 14.749, + "eval_wer": 0.4213099288144315, + "step": 6720 + }, + { + "epoch": 1.0, + "learning_rate": 9.535608308605342e-06, + "loss": 1.4227, + "step": 6760 + }, + { + "epoch": 1.0, + "eval_loss": 1.3376935720443726, + "eval_runtime": 516.5144, + "eval_samples_per_second": 14.79, + "eval_wer": 0.42113839732410874, + "step": 6760 + }, + { + "epoch": 1.01, + "learning_rate": 9.532640949554897e-06, + "loss": 1.3955, + "step": 6800 + }, + { + "epoch": 1.01, + "eval_loss": 1.3533991575241089, + "eval_runtime": 514.6016, + "eval_samples_per_second": 14.844, + "eval_wer": 0.4216244032133566, + "step": 6800 + }, + { + "epoch": 1.01, + "learning_rate": 9.529673590504451e-06, + "loss": 1.3004, + "step": 6840 + }, + { + "epoch": 1.01, + "eval_loss": 1.391702651977539, + "eval_runtime": 511.4823, + "eval_samples_per_second": 14.935, + "eval_wer": 0.4236541925155093, + "step": 6840 + }, + { + "epoch": 1.02, + "learning_rate": 9.526706231454007e-06, + "loss": 1.3724, + "step": 6880 + }, + { + "epoch": 1.02, + "eval_loss": 1.3138071298599243, + "eval_runtime": 511.2435, + "eval_samples_per_second": 14.942, + "eval_wer": 0.42013779696389264, + "step": 6880 + }, + { + "epoch": 1.02, + "learning_rate": 9.523738872403562e-06, + "loss": 1.3202, + "step": 6920 + }, + { + "epoch": 1.02, + "eval_loss": 1.3417410850524902, + "eval_runtime": 510.1636, + "eval_samples_per_second": 14.974, + "eval_wer": 0.42090968867034506, + "step": 6920 + }, + { + "epoch": 1.03, + "learning_rate": 9.520771513353116e-06, + "loss": 1.3622, + "step": 6960 + }, + { + "epoch": 1.03, + "eval_loss": 1.3786414861679077, + "eval_runtime": 511.1358, + "eval_samples_per_second": 14.945, + "eval_wer": 0.42362560393378884, + "step": 6960 + }, + { + "epoch": 1.03, + "learning_rate": 9.51780415430267e-06, + "loss": 1.3068, + "step": 7000 + }, + { + "epoch": 1.03, + "eval_loss": 1.2920615673065186, + "eval_runtime": 510.9693, + "eval_samples_per_second": 14.95, + "eval_wer": 0.4182795391520627, + "step": 7000 + }, + { + "epoch": 1.04, + "learning_rate": 9.514836795252227e-06, + "loss": 1.3176, + "step": 7040 + }, + { + "epoch": 1.04, + "eval_loss": 1.3531546592712402, + "eval_runtime": 512.3523, + "eval_samples_per_second": 14.91, + "eval_wer": 0.42225335201120673, + "step": 7040 + }, + { + "epoch": 1.05, + "learning_rate": 9.511869436201781e-06, + "loss": 1.3745, + "step": 7080 + }, + { + "epoch": 1.05, + "eval_loss": 1.3547227382659912, + "eval_runtime": 510.962, + "eval_samples_per_second": 14.95, + "eval_wer": 0.4216815803767975, + "step": 7080 + }, + { + "epoch": 1.05, + "learning_rate": 9.508902077151336e-06, + "loss": 1.3685, + "step": 7120 + }, + { + "epoch": 1.05, + "eval_loss": 1.3625860214233398, + "eval_runtime": 511.2574, + "eval_samples_per_second": 14.942, + "eval_wer": 0.4227107693187341, + "step": 7120 + }, + { + "epoch": 1.06, + "learning_rate": 9.505934718100892e-06, + "loss": 1.3105, + "step": 7160 + }, + { + "epoch": 1.06, + "eval_loss": 1.3234022855758667, + "eval_runtime": 510.0229, + "eval_samples_per_second": 14.978, + "eval_wer": 0.4194230824208811, + "step": 7160 + }, + { + "epoch": 1.06, + "learning_rate": 9.502967359050446e-06, + "loss": 1.3262, + "step": 7200 + }, + { + "epoch": 1.06, + "eval_loss": 1.3344852924346924, + "eval_runtime": 511.4089, + "eval_samples_per_second": 14.937, + "eval_wer": 0.42030932845421537, + "step": 7200 + }, + { + "epoch": 1.07, + "learning_rate": 9.5e-06, + "loss": 1.4309, + "step": 7240 + }, + { + "epoch": 1.07, + "eval_loss": 1.3332602977752686, + "eval_runtime": 511.2875, + "eval_samples_per_second": 14.941, + "eval_wer": 0.41970896823808573, + "step": 7240 + }, + { + "epoch": 1.08, + "learning_rate": 9.497032640949557e-06, + "loss": 1.3147, + "step": 7280 + }, + { + "epoch": 1.08, + "eval_loss": 1.2827751636505127, + "eval_runtime": 510.3482, + "eval_samples_per_second": 14.968, + "eval_wer": 0.4161639841047486, + "step": 7280 + }, + { + "epoch": 1.08, + "learning_rate": 9.494065281899111e-06, + "loss": 1.2877, + "step": 7320 + }, + { + "epoch": 1.08, + "eval_loss": 1.3272523880004883, + "eval_runtime": 511.7716, + "eval_samples_per_second": 14.927, + "eval_wer": 0.4184796592241059, + "step": 7320 + }, + { + "epoch": 1.09, + "learning_rate": 9.491097922848666e-06, + "loss": 1.3402, + "step": 7360 + }, + { + "epoch": 1.09, + "eval_loss": 1.3485498428344727, + "eval_runtime": 509.9959, + "eval_samples_per_second": 14.979, + "eval_wer": 0.419480259584322, + "step": 7360 + }, + { + "epoch": 1.09, + "learning_rate": 9.48813056379822e-06, + "loss": 1.312, + "step": 7400 + }, + { + "epoch": 1.09, + "eval_loss": 1.3199102878570557, + "eval_runtime": 510.0484, + "eval_samples_per_second": 14.977, + "eval_wer": 0.41867977929614913, + "step": 7400 + }, + { + "epoch": 1.1, + "learning_rate": 9.485163204747774e-06, + "loss": 1.4253, + "step": 7440 + }, + { + "epoch": 1.1, + "eval_loss": 1.2967960834503174, + "eval_runtime": 510.4372, + "eval_samples_per_second": 14.966, + "eval_wer": 0.41696446439292145, + "step": 7440 + }, + { + "epoch": 1.11, + "learning_rate": 9.48219584569733e-06, + "loss": 1.3595, + "step": 7480 + }, + { + "epoch": 1.11, + "eval_loss": 1.3033524751663208, + "eval_runtime": 515.2696, + "eval_samples_per_second": 14.825, + "eval_wer": 0.41596386403270535, + "step": 7480 + }, + { + "epoch": 1.11, + "learning_rate": 9.479228486646885e-06, + "loss": 1.3299, + "step": 7520 + }, + { + "epoch": 1.11, + "eval_loss": 1.3706648349761963, + "eval_runtime": 510.0742, + "eval_samples_per_second": 14.976, + "eval_wer": 0.42156722604991564, + "step": 7520 + }, + { + "epoch": 1.12, + "learning_rate": 9.47626112759644e-06, + "loss": 1.2884, + "step": 7560 + }, + { + "epoch": 1.12, + "eval_loss": 1.3058663606643677, + "eval_runtime": 512.8596, + "eval_samples_per_second": 14.895, + "eval_wer": 0.41553503530689845, + "step": 7560 + }, + { + "epoch": 1.12, + "learning_rate": 9.473293768545994e-06, + "loss": 1.2962, + "step": 7600 + }, + { + "epoch": 1.12, + "eval_loss": 1.3642096519470215, + "eval_runtime": 512.3802, + "eval_samples_per_second": 14.909, + "eval_wer": 0.41825095057034223, + "step": 7600 + }, + { + "epoch": 1.13, + "learning_rate": 9.47032640949555e-06, + "loss": 1.3444, + "step": 7640 + }, + { + "epoch": 1.13, + "eval_loss": 1.2833493947982788, + "eval_runtime": 513.3652, + "eval_samples_per_second": 14.88, + "eval_wer": 0.4122473484090454, + "step": 7640 + }, + { + "epoch": 1.14, + "learning_rate": 9.467359050445104e-06, + "loss": 1.2525, + "step": 7680 + }, + { + "epoch": 1.14, + "eval_loss": 1.3346291780471802, + "eval_runtime": 510.8062, + "eval_samples_per_second": 14.955, + "eval_wer": 0.4157637439606621, + "step": 7680 + }, + { + "epoch": 1.14, + "learning_rate": 9.46439169139466e-06, + "loss": 1.3447, + "step": 7720 + }, + { + "epoch": 1.14, + "eval_loss": 1.3114800453186035, + "eval_runtime": 513.4957, + "eval_samples_per_second": 14.876, + "eval_wer": 0.41516338374453243, + "step": 7720 + }, + { + "epoch": 1.15, + "learning_rate": 9.461424332344215e-06, + "loss": 1.3206, + "step": 7760 + }, + { + "epoch": 1.15, + "eval_loss": 1.3263444900512695, + "eval_runtime": 512.3013, + "eval_samples_per_second": 14.911, + "eval_wer": 0.41696446439292145, + "step": 7760 + }, + { + "epoch": 1.15, + "learning_rate": 9.45845697329377e-06, + "loss": 1.2992, + "step": 7800 + }, + { + "epoch": 1.15, + "eval_loss": 1.3342244625091553, + "eval_runtime": 511.7586, + "eval_samples_per_second": 14.927, + "eval_wer": 0.41670716715743733, + "step": 7800 + }, + { + "epoch": 1.16, + "learning_rate": 9.455489614243324e-06, + "loss": 1.2609, + "step": 7840 + }, + { + "epoch": 1.16, + "eval_loss": 1.2615351676940918, + "eval_runtime": 512.2206, + "eval_samples_per_second": 14.913, + "eval_wer": 0.4109322736499042, + "step": 7840 + }, + { + "epoch": 1.16, + "learning_rate": 9.452522255192878e-06, + "loss": 1.4939, + "step": 7880 + }, + { + "epoch": 1.16, + "eval_loss": 1.2486201524734497, + "eval_runtime": 516.8318, + "eval_samples_per_second": 14.78, + "eval_wer": 0.4109608622316247, + "step": 7880 + }, + { + "epoch": 1.17, + "learning_rate": 9.449554896142435e-06, + "loss": 1.2853, + "step": 7920 + }, + { + "epoch": 1.17, + "eval_loss": 1.3589729070663452, + "eval_runtime": 511.4097, + "eval_samples_per_second": 14.937, + "eval_wer": 0.418050830498299, + "step": 7920 + }, + { + "epoch": 1.18, + "learning_rate": 9.446587537091989e-06, + "loss": 1.3019, + "step": 7960 + }, + { + "epoch": 1.18, + "eval_loss": 1.2761421203613281, + "eval_runtime": 512.9489, + "eval_samples_per_second": 14.892, + "eval_wer": 0.4124760570628091, + "step": 7960 + }, + { + "epoch": 1.18, + "learning_rate": 9.443620178041543e-06, + "loss": 1.2466, + "step": 8000 + }, + { + "epoch": 1.18, + "eval_loss": 1.3334859609603882, + "eval_runtime": 510.8992, + "eval_samples_per_second": 14.952, + "eval_wer": 0.4163355155950713, + "step": 8000 + }, + { + "epoch": 1.19, + "learning_rate": 9.440652818991098e-06, + "loss": 1.4193, + "step": 8040 + }, + { + "epoch": 1.19, + "eval_loss": 1.2380253076553345, + "eval_runtime": 511.7445, + "eval_samples_per_second": 14.927, + "eval_wer": 0.4116183996111953, + "step": 8040 + }, + { + "epoch": 1.19, + "learning_rate": 9.437685459940652e-06, + "loss": 1.2979, + "step": 8080 + }, + { + "epoch": 1.19, + "eval_loss": 1.34476900100708, + "eval_runtime": 511.4657, + "eval_samples_per_second": 14.936, + "eval_wer": 0.41842248206066496, + "step": 8080 + }, + { + "epoch": 1.2, + "learning_rate": 9.434718100890208e-06, + "loss": 1.2847, + "step": 8120 + }, + { + "epoch": 1.2, + "eval_loss": 1.3185465335845947, + "eval_runtime": 512.9377, + "eval_samples_per_second": 14.893, + "eval_wer": 0.4161639841047486, + "step": 8120 + }, + { + "epoch": 1.21, + "learning_rate": 9.431750741839763e-06, + "loss": 1.3004, + "step": 8160 + }, + { + "epoch": 1.21, + "eval_loss": 1.3402063846588135, + "eval_runtime": 511.9363, + "eval_samples_per_second": 14.922, + "eval_wer": 0.4189084879499128, + "step": 8160 + }, + { + "epoch": 1.21, + "learning_rate": 9.428783382789319e-06, + "loss": 1.3362, + "step": 8200 + }, + { + "epoch": 1.21, + "eval_loss": 1.3436304330825806, + "eval_runtime": 511.6865, + "eval_samples_per_second": 14.929, + "eval_wer": 0.41825095057034223, + "step": 8200 + }, + { + "epoch": 1.22, + "learning_rate": 9.425816023738873e-06, + "loss": 1.296, + "step": 8240 + }, + { + "epoch": 1.22, + "eval_loss": 1.2706687450408936, + "eval_runtime": 512.2774, + "eval_samples_per_second": 14.912, + "eval_wer": 0.4124760570628091, + "step": 8240 + }, + { + "epoch": 1.22, + "learning_rate": 9.422848664688428e-06, + "loss": 1.2576, + "step": 8280 + }, + { + "epoch": 1.22, + "eval_loss": 1.2736766338348389, + "eval_runtime": 511.8436, + "eval_samples_per_second": 14.924, + "eval_wer": 0.4117041653563567, + "step": 8280 + }, + { + "epoch": 1.23, + "learning_rate": 9.419881305637984e-06, + "loss": 1.2528, + "step": 8320 + }, + { + "epoch": 1.23, + "eval_loss": 1.3490320444107056, + "eval_runtime": 511.6838, + "eval_samples_per_second": 14.929, + "eval_wer": 0.41670716715743733, + "step": 8320 + }, + { + "epoch": 1.24, + "learning_rate": 9.416913946587538e-06, + "loss": 1.2786, + "step": 8360 + }, + { + "epoch": 1.24, + "eval_loss": 1.3121426105499268, + "eval_runtime": 510.9949, + "eval_samples_per_second": 14.949, + "eval_wer": 0.4135052460047457, + "step": 8360 + }, + { + "epoch": 1.24, + "learning_rate": 9.413946587537093e-06, + "loss": 1.3974, + "step": 8400 + }, + { + "epoch": 1.24, + "eval_loss": 1.2293121814727783, + "eval_runtime": 512.0033, + "eval_samples_per_second": 14.92, + "eval_wer": 0.40850224420366504, + "step": 8400 + }, + { + "epoch": 1.25, + "learning_rate": 9.410979228486647e-06, + "loss": 1.289, + "step": 8440 + }, + { + "epoch": 1.25, + "eval_loss": 1.312703251838684, + "eval_runtime": 511.7291, + "eval_samples_per_second": 14.928, + "eval_wer": 0.41439149203808, + "step": 8440 + }, + { + "epoch": 1.25, + "learning_rate": 9.408011869436202e-06, + "loss": 1.3042, + "step": 8480 + }, + { + "epoch": 1.25, + "eval_loss": 1.2950646877288818, + "eval_runtime": 511.6576, + "eval_samples_per_second": 14.93, + "eval_wer": 0.41304782869721834, + "step": 8480 + }, + { + "epoch": 1.26, + "learning_rate": 9.405044510385758e-06, + "loss": 1.3192, + "step": 8520 + }, + { + "epoch": 1.26, + "eval_loss": 1.2467378377914429, + "eval_runtime": 511.3151, + "eval_samples_per_second": 14.94, + "eval_wer": 0.4099316732896881, + "step": 8520 + }, + { + "epoch": 1.27, + "learning_rate": 9.402077151335312e-06, + "loss": 1.2991, + "step": 8560 + }, + { + "epoch": 1.27, + "eval_loss": 1.3041272163391113, + "eval_runtime": 514.8761, + "eval_samples_per_second": 14.837, + "eval_wer": 0.4144486692015209, + "step": 8560 + }, + { + "epoch": 1.27, + "learning_rate": 9.399109792284867e-06, + "loss": 1.2369, + "step": 8600 + }, + { + "epoch": 1.27, + "eval_loss": 1.3044118881225586, + "eval_runtime": 513.4671, + "eval_samples_per_second": 14.877, + "eval_wer": 0.41507761799937104, + "step": 8600 + }, + { + "epoch": 1.28, + "learning_rate": 9.396142433234421e-06, + "loss": 1.2538, + "step": 8640 + }, + { + "epoch": 1.28, + "eval_loss": 1.2771389484405518, + "eval_runtime": 512.6229, + "eval_samples_per_second": 14.902, + "eval_wer": 0.41187569684667946, + "step": 8640 + }, + { + "epoch": 1.28, + "learning_rate": 9.393175074183977e-06, + "loss": 1.274, + "step": 8680 + }, + { + "epoch": 1.28, + "eval_loss": 1.3738703727722168, + "eval_runtime": 514.2482, + "eval_samples_per_second": 14.855, + "eval_wer": 0.4177649446810944, + "step": 8680 + }, + { + "epoch": 1.29, + "learning_rate": 9.390207715133532e-06, + "loss": 1.3129, + "step": 8720 + }, + { + "epoch": 1.29, + "eval_loss": 1.3008581399917603, + "eval_runtime": 512.9228, + "eval_samples_per_second": 14.893, + "eval_wer": 0.4133623030961434, + "step": 8720 + }, + { + "epoch": 1.29, + "learning_rate": 9.387240356083088e-06, + "loss": 1.2148, + "step": 8760 + }, + { + "epoch": 1.29, + "eval_loss": 1.3074074983596802, + "eval_runtime": 512.994, + "eval_samples_per_second": 14.891, + "eval_wer": 0.4138483089853912, + "step": 8760 + }, + { + "epoch": 1.3, + "learning_rate": 9.384272997032642e-06, + "loss": 1.405, + "step": 8800 + }, + { + "epoch": 1.3, + "eval_loss": 1.2787606716156006, + "eval_runtime": 515.1034, + "eval_samples_per_second": 14.83, + "eval_wer": 0.411475456702593, + "step": 8800 + }, + { + "epoch": 1.31, + "learning_rate": 9.381305637982197e-06, + "loss": 1.2723, + "step": 8840 + }, + { + "epoch": 1.31, + "eval_loss": 1.2887216806411743, + "eval_runtime": 511.9564, + "eval_samples_per_second": 14.921, + "eval_wer": 0.41236170273592726, + "step": 8840 + }, + { + "epoch": 1.31, + "learning_rate": 9.378338278931751e-06, + "loss": 1.2829, + "step": 8880 + }, + { + "epoch": 1.31, + "eval_loss": 1.2829817533493042, + "eval_runtime": 511.8011, + "eval_samples_per_second": 14.926, + "eval_wer": 0.41176134251979757, + "step": 8880 + }, + { + "epoch": 1.32, + "learning_rate": 9.375370919881306e-06, + "loss": 1.3702, + "step": 8920 + }, + { + "epoch": 1.32, + "eval_loss": 1.29217529296875, + "eval_runtime": 511.7848, + "eval_samples_per_second": 14.926, + "eval_wer": 0.4116183996111953, + "step": 8920 + }, + { + "epoch": 1.32, + "learning_rate": 9.372403560830862e-06, + "loss": 1.281, + "step": 8960 + }, + { + "epoch": 1.32, + "eval_loss": 1.2968708276748657, + "eval_runtime": 513.6716, + "eval_samples_per_second": 14.871, + "eval_wer": 0.41041767917893596, + "step": 8960 + }, + { + "epoch": 1.33, + "learning_rate": 9.369436201780416e-06, + "loss": 1.2917, + "step": 9000 + }, + { + "epoch": 1.33, + "eval_loss": 1.3134349584579468, + "eval_runtime": 512.644, + "eval_samples_per_second": 14.901, + "eval_wer": 0.41219017124560453, + "step": 9000 + }, + { + "epoch": 1.34, + "learning_rate": 9.36646884272997e-06, + "loss": 1.2533, + "step": 9040 + }, + { + "epoch": 1.34, + "eval_loss": 1.2987614870071411, + "eval_runtime": 511.8914, + "eval_samples_per_second": 14.923, + "eval_wer": 0.4119614625918408, + "step": 9040 + }, + { + "epoch": 1.34, + "learning_rate": 9.363501483679525e-06, + "loss": 1.1882, + "step": 9080 + }, + { + "epoch": 1.34, + "eval_loss": 1.366603136062622, + "eval_runtime": 512.2776, + "eval_samples_per_second": 14.912, + "eval_wer": 0.4163641041767918, + "step": 9080 + }, + { + "epoch": 1.35, + "learning_rate": 9.36053412462908e-06, + "loss": 1.3309, + "step": 9120 + }, + { + "epoch": 1.35, + "eval_loss": 1.25356924533844, + "eval_runtime": 513.5071, + "eval_samples_per_second": 14.876, + "eval_wer": 0.40893107292947195, + "step": 9120 + }, + { + "epoch": 1.35, + "learning_rate": 9.357566765578636e-06, + "loss": 1.3681, + "step": 9160 + }, + { + "epoch": 1.35, + "eval_loss": 1.3336553573608398, + "eval_runtime": 516.6108, + "eval_samples_per_second": 14.787, + "eval_wer": 0.4156493896337803, + "step": 9160 + }, + { + "epoch": 1.36, + "learning_rate": 9.35459940652819e-06, + "loss": 1.266, + "step": 9200 + }, + { + "epoch": 1.36, + "eval_loss": 1.270060658454895, + "eval_runtime": 511.859, + "eval_samples_per_second": 14.924, + "eval_wer": 0.41098945081334515, + "step": 9200 + }, + { + "epoch": 1.37, + "learning_rate": 9.351632047477746e-06, + "loss": 1.3068, + "step": 9240 + }, + { + "epoch": 1.37, + "eval_loss": 1.2187365293502808, + "eval_runtime": 513.7027, + "eval_samples_per_second": 14.87, + "eval_wer": 0.4092741359101175, + "step": 9240 + }, + { + "epoch": 1.37, + "learning_rate": 9.3486646884273e-06, + "loss": 1.2812, + "step": 9280 + }, + { + "epoch": 1.37, + "eval_loss": 1.2569447755813599, + "eval_runtime": 512.9118, + "eval_samples_per_second": 14.893, + "eval_wer": 0.4098459075445267, + "step": 9280 + }, + { + "epoch": 1.38, + "learning_rate": 9.345697329376855e-06, + "loss": 1.2683, + "step": 9320 + }, + { + "epoch": 1.38, + "eval_loss": 1.2560864686965942, + "eval_runtime": 512.9368, + "eval_samples_per_second": 14.893, + "eval_wer": 0.4077303524972126, + "step": 9320 + }, + { + "epoch": 1.38, + "learning_rate": 9.342729970326411e-06, + "loss": 1.277, + "step": 9360 + }, + { + "epoch": 1.38, + "eval_loss": 1.3354778289794922, + "eval_runtime": 512.9536, + "eval_samples_per_second": 14.892, + "eval_wer": 0.41361960033162753, + "step": 9360 + }, + { + "epoch": 1.39, + "learning_rate": 9.339762611275966e-06, + "loss": 1.3425, + "step": 9400 + }, + { + "epoch": 1.39, + "eval_loss": 1.2977571487426758, + "eval_runtime": 514.5297, + "eval_samples_per_second": 14.847, + "eval_wer": 0.41033191343377456, + "step": 9400 + }, + { + "epoch": 1.4, + "learning_rate": 9.33679525222552e-06, + "loss": 1.2072, + "step": 9440 + }, + { + "epoch": 1.4, + "eval_loss": 1.3424071073532104, + "eval_runtime": 512.9194, + "eval_samples_per_second": 14.893, + "eval_wer": 0.41356242316818664, + "step": 9440 + }, + { + "epoch": 1.4, + "learning_rate": 9.333827893175075e-06, + "loss": 1.2499, + "step": 9480 + }, + { + "epoch": 1.4, + "eval_loss": 1.260184645652771, + "eval_runtime": 513.0866, + "eval_samples_per_second": 14.888, + "eval_wer": 0.4076731753337717, + "step": 9480 + }, + { + "epoch": 1.41, + "learning_rate": 9.330860534124629e-06, + "loss": 1.3242, + "step": 9520 + }, + { + "epoch": 1.41, + "eval_loss": 1.2436482906341553, + "eval_runtime": 512.6621, + "eval_samples_per_second": 14.901, + "eval_wer": 0.40698704937248065, + "step": 9520 + }, + { + "epoch": 1.41, + "learning_rate": 9.327893175074185e-06, + "loss": 1.2121, + "step": 9560 + }, + { + "epoch": 1.41, + "eval_loss": 1.315924048423767, + "eval_runtime": 517.4858, + "eval_samples_per_second": 14.762, + "eval_wer": 0.4115612224477544, + "step": 9560 + }, + { + "epoch": 1.42, + "learning_rate": 9.32492581602374e-06, + "loss": 1.2659, + "step": 9600 + }, + { + "epoch": 1.42, + "eval_loss": 1.3112881183624268, + "eval_runtime": 513.0476, + "eval_samples_per_second": 14.889, + "eval_wer": 0.41136110237571116, + "step": 9600 + }, + { + "epoch": 1.42, + "learning_rate": 9.321958456973294e-06, + "loss": 1.2823, + "step": 9640 + }, + { + "epoch": 1.42, + "eval_loss": 1.255016565322876, + "eval_runtime": 512.8326, + "eval_samples_per_second": 14.896, + "eval_wer": 0.4077303524972126, + "step": 9640 + }, + { + "epoch": 1.43, + "learning_rate": 9.318991097922849e-06, + "loss": 1.308, + "step": 9680 + }, + { + "epoch": 1.43, + "eval_loss": 1.2840029001235962, + "eval_runtime": 513.1565, + "eval_samples_per_second": 14.886, + "eval_wer": 0.409245547328397, + "step": 9680 + }, + { + "epoch": 1.44, + "learning_rate": 9.316023738872405e-06, + "loss": 1.2977, + "step": 9720 + }, + { + "epoch": 1.44, + "eval_loss": 1.268050193786621, + "eval_runtime": 512.2449, + "eval_samples_per_second": 14.913, + "eval_wer": 0.4081305926412991, + "step": 9720 + }, + { + "epoch": 1.44, + "learning_rate": 9.31305637982196e-06, + "loss": 1.2957, + "step": 9760 + }, + { + "epoch": 1.44, + "eval_loss": 1.283426284790039, + "eval_runtime": 511.628, + "eval_samples_per_second": 14.931, + "eval_wer": 0.4097887303810858, + "step": 9760 + }, + { + "epoch": 1.45, + "learning_rate": 9.310089020771514e-06, + "loss": 1.267, + "step": 9800 + }, + { + "epoch": 1.45, + "eval_loss": 1.2938474416732788, + "eval_runtime": 516.6714, + "eval_samples_per_second": 14.785, + "eval_wer": 0.4100174390348495, + "step": 9800 + }, + { + "epoch": 1.45, + "learning_rate": 9.30712166172107e-06, + "loss": 1.2047, + "step": 9840 + }, + { + "epoch": 1.45, + "eval_loss": 1.2899694442749023, + "eval_runtime": 512.2028, + "eval_samples_per_second": 14.914, + "eval_wer": 0.4095028445638812, + "step": 9840 + }, + { + "epoch": 1.46, + "learning_rate": 9.304154302670624e-06, + "loss": 1.2514, + "step": 9880 + }, + { + "epoch": 1.46, + "eval_loss": 1.3348511457443237, + "eval_runtime": 515.2287, + "eval_samples_per_second": 14.826, + "eval_wer": 0.4124188798993682, + "step": 9880 + }, + { + "epoch": 1.47, + "learning_rate": 9.301186943620179e-06, + "loss": 1.3509, + "step": 9920 + }, + { + "epoch": 1.47, + "eval_loss": 1.2478821277618408, + "eval_runtime": 514.987, + "eval_samples_per_second": 14.833, + "eval_wer": 0.40698704937248065, + "step": 9920 + }, + { + "epoch": 1.47, + "learning_rate": 9.298219584569733e-06, + "loss": 1.2415, + "step": 9960 + }, + { + "epoch": 1.47, + "eval_loss": 1.2861199378967285, + "eval_runtime": 512.282, + "eval_samples_per_second": 14.912, + "eval_wer": 0.40918837016495613, + "step": 9960 + }, + { + "epoch": 1.48, + "learning_rate": 9.29525222551929e-06, + "loss": 1.268, + "step": 10000 + }, + { + "epoch": 1.48, + "eval_loss": 1.2546372413635254, + "eval_runtime": 511.9898, + "eval_samples_per_second": 14.92, + "eval_wer": 0.40672975213699647, + "step": 10000 + }, + { + "epoch": 1.48, + "learning_rate": 9.292284866468844e-06, + "loss": 1.2385, + "step": 10040 + }, + { + "epoch": 1.48, + "eval_loss": 1.2831658124923706, + "eval_runtime": 514.9079, + "eval_samples_per_second": 14.836, + "eval_wer": 0.40858800994882644, + "step": 10040 + }, + { + "epoch": 1.49, + "learning_rate": 9.289317507418398e-06, + "loss": 1.2977, + "step": 10080 + }, + { + "epoch": 1.49, + "eval_loss": 1.2325489521026611, + "eval_runtime": 513.672, + "eval_samples_per_second": 14.871, + "eval_wer": 0.4037279510563481, + "step": 10080 + }, + { + "epoch": 1.5, + "learning_rate": 9.286350148367953e-06, + "loss": 1.2312, + "step": 10120 + }, + { + "epoch": 1.5, + "eval_loss": 1.3027517795562744, + "eval_runtime": 512.8506, + "eval_samples_per_second": 14.895, + "eval_wer": 0.40901683867463334, + "step": 10120 + }, + { + "epoch": 1.5, + "learning_rate": 9.283382789317507e-06, + "loss": 1.3768, + "step": 10160 + }, + { + "epoch": 1.5, + "eval_loss": 1.2500500679016113, + "eval_runtime": 517.3558, + "eval_samples_per_second": 14.765, + "eval_wer": 0.4052431458875325, + "step": 10160 + }, + { + "epoch": 1.51, + "learning_rate": 9.280415430267063e-06, + "loss": 1.2225, + "step": 10200 + }, + { + "epoch": 1.51, + "eval_loss": 1.2987366914749146, + "eval_runtime": 514.1854, + "eval_samples_per_second": 14.857, + "eval_wer": 0.40947425598216075, + "step": 10200 + }, + { + "epoch": 1.51, + "learning_rate": 9.277448071216618e-06, + "loss": 1.3326, + "step": 10240 + }, + { + "epoch": 1.51, + "eval_loss": 1.2808113098144531, + "eval_runtime": 512.7928, + "eval_samples_per_second": 14.897, + "eval_wer": 0.40750164384344895, + "step": 10240 + }, + { + "epoch": 1.52, + "learning_rate": 9.274480712166174e-06, + "loss": 1.2844, + "step": 10280 + }, + { + "epoch": 1.52, + "eval_loss": 1.2755920886993408, + "eval_runtime": 513.9899, + "eval_samples_per_second": 14.862, + "eval_wer": 0.40681551788215786, + "step": 10280 + }, + { + "epoch": 1.53, + "learning_rate": 9.271513353115728e-06, + "loss": 1.3656, + "step": 10320 + }, + { + "epoch": 1.53, + "eval_loss": 1.1596375703811646, + "eval_runtime": 515.8418, + "eval_samples_per_second": 14.809, + "eval_wer": 0.39603762257354413, + "step": 10320 + }, + { + "epoch": 1.53, + "learning_rate": 9.268545994065283e-06, + "loss": 1.199, + "step": 10360 + }, + { + "epoch": 1.53, + "eval_loss": 1.266614317893982, + "eval_runtime": 514.0401, + "eval_samples_per_second": 14.861, + "eval_wer": 0.40510020297893023, + "step": 10360 + }, + { + "epoch": 1.54, + "learning_rate": 9.265578635014839e-06, + "loss": 1.4069, + "step": 10400 + }, + { + "epoch": 1.54, + "eval_loss": 1.2308021783828735, + "eval_runtime": 514.5562, + "eval_samples_per_second": 14.846, + "eval_wer": 0.40407101403699364, + "step": 10400 + }, + { + "epoch": 1.54, + "learning_rate": 9.262611275964393e-06, + "loss": 1.254, + "step": 10440 + }, + { + "epoch": 1.54, + "eval_loss": 1.2571922540664673, + "eval_runtime": 514.7648, + "eval_samples_per_second": 14.84, + "eval_wer": 0.4059006832671031, + "step": 10440 + }, + { + "epoch": 1.55, + "learning_rate": 9.259643916913948e-06, + "loss": 1.2367, + "step": 10480 + }, + { + "epoch": 1.55, + "eval_loss": 1.2930080890655518, + "eval_runtime": 513.8769, + "eval_samples_per_second": 14.865, + "eval_wer": 0.4084736556219446, + "step": 10480 + }, + { + "epoch": 1.55, + "learning_rate": 9.256676557863502e-06, + "loss": 1.2301, + "step": 10520 + }, + { + "epoch": 1.55, + "eval_loss": 1.2341119050979614, + "eval_runtime": 515.0285, + "eval_samples_per_second": 14.832, + "eval_wer": 0.4028417050230138, + "step": 10520 + }, + { + "epoch": 1.56, + "learning_rate": 9.253709198813056e-06, + "loss": 1.3147, + "step": 10560 + }, + { + "epoch": 1.56, + "eval_loss": 1.2303303480148315, + "eval_runtime": 514.6134, + "eval_samples_per_second": 14.844, + "eval_wer": 0.40312759084021843, + "step": 10560 + }, + { + "epoch": 1.57, + "learning_rate": 9.250741839762613e-06, + "loss": 1.2585, + "step": 10600 + }, + { + "epoch": 1.57, + "eval_loss": 1.1945106983184814, + "eval_runtime": 514.6525, + "eval_samples_per_second": 14.843, + "eval_wer": 0.3996969610337631, + "step": 10600 + }, + { + "epoch": 1.57, + "learning_rate": 9.247774480712167e-06, + "loss": 1.2957, + "step": 10640 + }, + { + "epoch": 1.57, + "eval_loss": 1.2003751993179321, + "eval_runtime": 515.0689, + "eval_samples_per_second": 14.831, + "eval_wer": 0.4016409845907545, + "step": 10640 + }, + { + "epoch": 1.58, + "learning_rate": 9.244807121661721e-06, + "loss": 1.3104, + "step": 10680 + }, + { + "epoch": 1.58, + "eval_loss": 1.1565747261047363, + "eval_runtime": 514.613, + "eval_samples_per_second": 14.844, + "eval_wer": 0.3986391835101061, + "step": 10680 + }, + { + "epoch": 1.58, + "learning_rate": 9.241839762611276e-06, + "loss": 1.3232, + "step": 10720 + }, + { + "epoch": 1.58, + "eval_loss": 1.1890604496002197, + "eval_runtime": 515.175, + "eval_samples_per_second": 14.828, + "eval_wer": 0.40046885274021554, + "step": 10720 + }, + { + "epoch": 1.59, + "learning_rate": 9.238872403560832e-06, + "loss": 1.2452, + "step": 10760 + }, + { + "epoch": 1.59, + "eval_loss": 1.24032723903656, + "eval_runtime": 515.0885, + "eval_samples_per_second": 14.83, + "eval_wer": 0.404528431344521, + "step": 10760 + }, + { + "epoch": 1.6, + "learning_rate": 9.235905044510387e-06, + "loss": 1.1773, + "step": 10800 + }, + { + "epoch": 1.6, + "eval_loss": 1.2857545614242554, + "eval_runtime": 514.772, + "eval_samples_per_second": 14.84, + "eval_wer": 0.4080448268961377, + "step": 10800 + }, + { + "epoch": 1.6, + "learning_rate": 9.232937685459941e-06, + "loss": 1.2669, + "step": 10840 + }, + { + "epoch": 1.6, + "eval_loss": 1.2499992847442627, + "eval_runtime": 519.9379, + "eval_samples_per_second": 14.692, + "eval_wer": 0.40484290574344606, + "step": 10840 + }, + { + "epoch": 1.61, + "learning_rate": 9.229970326409497e-06, + "loss": 1.3103, + "step": 10880 + }, + { + "epoch": 1.61, + "eval_loss": 1.2001954317092896, + "eval_runtime": 515.0719, + "eval_samples_per_second": 14.831, + "eval_wer": 0.4006689728122588, + "step": 10880 + }, + { + "epoch": 1.61, + "learning_rate": 9.227002967359052e-06, + "loss": 1.2252, + "step": 10920 + }, + { + "epoch": 1.61, + "eval_loss": 1.2275313138961792, + "eval_runtime": 516.3934, + "eval_samples_per_second": 14.793, + "eval_wer": 0.4024986420423683, + "step": 10920 + }, + { + "epoch": 1.62, + "learning_rate": 9.224035608308606e-06, + "loss": 1.2112, + "step": 10960 + }, + { + "epoch": 1.62, + "eval_loss": 1.2510746717453003, + "eval_runtime": 516.5026, + "eval_samples_per_second": 14.79, + "eval_wer": 0.4039566597101118, + "step": 10960 + }, + { + "epoch": 1.63, + "learning_rate": 9.22106824925816e-06, + "loss": 1.2848, + "step": 11000 + }, + { + "epoch": 1.63, + "eval_loss": 1.2750122547149658, + "eval_runtime": 515.8183, + "eval_samples_per_second": 14.809, + "eval_wer": 0.40595786043054405, + "step": 11000 + }, + { + "epoch": 1.63, + "learning_rate": 9.218100890207717e-06, + "loss": 1.3216, + "step": 11040 + }, + { + "epoch": 1.63, + "eval_loss": 1.1478713750839233, + "eval_runtime": 520.3525, + "eval_samples_per_second": 14.68, + "eval_wer": 0.39675233711655566, + "step": 11040 + }, + { + "epoch": 1.64, + "learning_rate": 9.215133531157271e-06, + "loss": 1.2425, + "step": 11080 + }, + { + "epoch": 1.64, + "eval_loss": 1.22694730758667, + "eval_runtime": 516.1758, + "eval_samples_per_second": 14.799, + "eval_wer": 0.40312759084021843, + "step": 11080 + }, + { + "epoch": 1.64, + "learning_rate": 9.212166172106825e-06, + "loss": 1.3123, + "step": 11120 + }, + { + "epoch": 1.64, + "eval_loss": 1.2139358520507812, + "eval_runtime": 515.0839, + "eval_samples_per_second": 14.831, + "eval_wer": 0.40244146487892735, + "step": 11120 + }, + { + "epoch": 1.65, + "learning_rate": 9.20919881305638e-06, + "loss": 1.3536, + "step": 11160 + }, + { + "epoch": 1.65, + "eval_loss": 1.217216968536377, + "eval_runtime": 515.3623, + "eval_samples_per_second": 14.823, + "eval_wer": 0.4025844077875297, + "step": 11160 + }, + { + "epoch": 1.66, + "learning_rate": 9.206231454005934e-06, + "loss": 1.2508, + "step": 11200 + }, + { + "epoch": 1.66, + "eval_loss": 1.1941343545913696, + "eval_runtime": 515.9446, + "eval_samples_per_second": 14.806, + "eval_wer": 0.4000114354326882, + "step": 11200 + }, + { + "epoch": 1.66, + "learning_rate": 9.20326409495549e-06, + "loss": 1.2845, + "step": 11240 + }, + { + "epoch": 1.66, + "eval_loss": 1.2311153411865234, + "eval_runtime": 514.9361, + "eval_samples_per_second": 14.835, + "eval_wer": 0.40235569913376595, + "step": 11240 + }, + { + "epoch": 1.67, + "learning_rate": 9.200296735905045e-06, + "loss": 1.2305, + "step": 11280 + }, + { + "epoch": 1.67, + "eval_loss": 1.1851820945739746, + "eval_runtime": 516.8997, + "eval_samples_per_second": 14.778, + "eval_wer": 0.3988964807455902, + "step": 11280 + }, + { + "epoch": 1.67, + "learning_rate": 9.1973293768546e-06, + "loss": 1.2377, + "step": 11320 + }, + { + "epoch": 1.67, + "eval_loss": 1.2103943824768066, + "eval_runtime": 515.6118, + "eval_samples_per_second": 14.815, + "eval_wer": 0.4002115555047314, + "step": 11320 + }, + { + "epoch": 1.68, + "learning_rate": 9.194362017804155e-06, + "loss": 1.3146, + "step": 11360 + }, + { + "epoch": 1.68, + "eval_loss": 1.1271100044250488, + "eval_runtime": 514.652, + "eval_samples_per_second": 14.843, + "eval_wer": 0.3947225478144029, + "step": 11360 + }, + { + "epoch": 1.69, + "learning_rate": 9.19139465875371e-06, + "loss": 1.2701, + "step": 11400 + }, + { + "epoch": 1.69, + "eval_loss": 1.1794366836547852, + "eval_runtime": 514.8999, + "eval_samples_per_second": 14.836, + "eval_wer": 0.3988964807455902, + "step": 11400 + }, + { + "epoch": 1.69, + "learning_rate": 9.188427299703266e-06, + "loss": 1.3691, + "step": 11440 + }, + { + "epoch": 1.69, + "eval_loss": 1.1657973527908325, + "eval_runtime": 519.8883, + "eval_samples_per_second": 14.694, + "eval_wer": 0.39718116584236257, + "step": 11440 + }, + { + "epoch": 1.7, + "learning_rate": 9.18545994065282e-06, + "loss": 1.2245, + "step": 11480 + }, + { + "epoch": 1.7, + "eval_loss": 1.3082857131958008, + "eval_runtime": 515.8967, + "eval_samples_per_second": 14.807, + "eval_wer": 0.4099316732896881, + "step": 11480 + }, + { + "epoch": 1.7, + "learning_rate": 9.182492581602375e-06, + "loss": 1.3501, + "step": 11520 + }, + { + "epoch": 1.7, + "eval_loss": 1.1687225103378296, + "eval_runtime": 515.5136, + "eval_samples_per_second": 14.818, + "eval_wer": 0.39703822293376023, + "step": 11520 + }, + { + "epoch": 1.71, + "learning_rate": 9.17952522255193e-06, + "loss": 1.2943, + "step": 11560 + }, + { + "epoch": 1.71, + "eval_loss": 1.2141493558883667, + "eval_runtime": 514.6303, + "eval_samples_per_second": 14.844, + "eval_wer": 0.40041167557677465, + "step": 11560 + }, + { + "epoch": 1.71, + "learning_rate": 9.176557863501484e-06, + "loss": 1.288, + "step": 11600 + }, + { + "epoch": 1.71, + "eval_loss": 1.1936476230621338, + "eval_runtime": 514.4918, + "eval_samples_per_second": 14.848, + "eval_wer": 0.39818176620257867, + "step": 11600 + }, + { + "epoch": 1.72, + "learning_rate": 9.17359050445104e-06, + "loss": 1.285, + "step": 11640 + }, + { + "epoch": 1.72, + "eval_loss": 1.1829966306686401, + "eval_runtime": 515.1035, + "eval_samples_per_second": 14.83, + "eval_wer": 0.3971525772606421, + "step": 11640 + }, + { + "epoch": 1.73, + "learning_rate": 9.170623145400594e-06, + "loss": 1.2059, + "step": 11680 + }, + { + "epoch": 1.73, + "eval_loss": 1.2137354612350464, + "eval_runtime": 519.0409, + "eval_samples_per_second": 14.718, + "eval_wer": 0.39938248663483805, + "step": 11680 + }, + { + "epoch": 1.73, + "learning_rate": 9.167655786350149e-06, + "loss": 1.1926, + "step": 11720 + }, + { + "epoch": 1.73, + "eval_loss": 1.209702491760254, + "eval_runtime": 514.9115, + "eval_samples_per_second": 14.836, + "eval_wer": 0.3996397838703222, + "step": 11720 + }, + { + "epoch": 1.74, + "learning_rate": 9.164688427299703e-06, + "loss": 1.279, + "step": 11760 + }, + { + "epoch": 1.74, + "eval_loss": 1.2162266969680786, + "eval_runtime": 514.3955, + "eval_samples_per_second": 14.85, + "eval_wer": 0.4010120357929043, + "step": 11760 + }, + { + "epoch": 1.74, + "learning_rate": 9.161721068249258e-06, + "loss": 1.2614, + "step": 11800 + }, + { + "epoch": 1.74, + "eval_loss": 1.2356311082839966, + "eval_runtime": 514.6584, + "eval_samples_per_second": 14.843, + "eval_wer": 0.4027559392778524, + "step": 11800 + }, + { + "epoch": 1.75, + "learning_rate": 9.158753709198814e-06, + "loss": 1.2234, + "step": 11840 + }, + { + "epoch": 1.75, + "eval_loss": 1.2179203033447266, + "eval_runtime": 516.174, + "eval_samples_per_second": 14.799, + "eval_wer": 0.3995826067068813, + "step": 11840 + }, + { + "epoch": 1.76, + "learning_rate": 9.155786350148368e-06, + "loss": 1.246, + "step": 11880 + }, + { + "epoch": 1.76, + "eval_loss": 1.2087491750717163, + "eval_runtime": 515.5898, + "eval_samples_per_second": 14.816, + "eval_wer": 0.39818176620257867, + "step": 11880 + }, + { + "epoch": 1.76, + "learning_rate": 9.152818991097924e-06, + "loss": 1.2865, + "step": 11920 + }, + { + "epoch": 1.76, + "eval_loss": 1.1791400909423828, + "eval_runtime": 515.7846, + "eval_samples_per_second": 14.81, + "eval_wer": 0.396523628462792, + "step": 11920 + }, + { + "epoch": 1.77, + "learning_rate": 9.149851632047479e-06, + "loss": 1.2409, + "step": 11960 + }, + { + "epoch": 1.77, + "eval_loss": 1.1861945390701294, + "eval_runtime": 514.5033, + "eval_samples_per_second": 14.847, + "eval_wer": 0.39620915406386686, + "step": 11960 + }, + { + "epoch": 1.77, + "learning_rate": 9.146884272997033e-06, + "loss": 1.2177, + "step": 12000 + }, + { + "epoch": 1.77, + "eval_loss": 1.2645891904830933, + "eval_runtime": 515.0621, + "eval_samples_per_second": 14.831, + "eval_wer": 0.40289888218645475, + "step": 12000 + }, + { + "epoch": 1.78, + "learning_rate": 9.143916913946588e-06, + "loss": 1.2715, + "step": 12040 + }, + { + "epoch": 1.78, + "eval_loss": 1.1953966617584229, + "eval_runtime": 514.3882, + "eval_samples_per_second": 14.851, + "eval_wer": 0.3956373824294577, + "step": 12040 + }, + { + "epoch": 1.79, + "learning_rate": 9.140949554896144e-06, + "loss": 1.3551, + "step": 12080 + }, + { + "epoch": 1.79, + "eval_loss": 1.1641371250152588, + "eval_runtime": 519.7734, + "eval_samples_per_second": 14.697, + "eval_wer": 0.3949512564681666, + "step": 12080 + }, + { + "epoch": 1.79, + "learning_rate": 9.137982195845698e-06, + "loss": 1.305, + "step": 12120 + }, + { + "epoch": 1.79, + "eval_loss": 1.1996777057647705, + "eval_runtime": 513.9019, + "eval_samples_per_second": 14.865, + "eval_wer": 0.397953057548815, + "step": 12120 + }, + { + "epoch": 1.8, + "learning_rate": 9.135014836795253e-06, + "loss": 1.2813, + "step": 12160 + }, + { + "epoch": 1.8, + "eval_loss": 1.168097734451294, + "eval_runtime": 514.743, + "eval_samples_per_second": 14.84, + "eval_wer": 0.39623774264558737, + "step": 12160 + }, + { + "epoch": 1.8, + "learning_rate": 9.132047477744807e-06, + "loss": 1.2227, + "step": 12200 + }, + { + "epoch": 1.8, + "eval_loss": 1.1406610012054443, + "eval_runtime": 520.5862, + "eval_samples_per_second": 14.674, + "eval_wer": 0.3927785242574116, + "step": 12200 + }, + { + "epoch": 1.81, + "learning_rate": 9.129080118694362e-06, + "loss": 1.2228, + "step": 12240 + }, + { + "epoch": 1.81, + "eval_loss": 1.2118908166885376, + "eval_runtime": 516.513, + "eval_samples_per_second": 14.79, + "eval_wer": 0.39801023471225594, + "step": 12240 + }, + { + "epoch": 1.82, + "learning_rate": 9.126112759643918e-06, + "loss": 1.2309, + "step": 12280 + }, + { + "epoch": 1.82, + "eval_loss": 1.2271971702575684, + "eval_runtime": 514.5095, + "eval_samples_per_second": 14.847, + "eval_wer": 0.39955401812516084, + "step": 12280 + }, + { + "epoch": 1.82, + "learning_rate": 9.123145400593472e-06, + "loss": 1.2576, + "step": 12320 + }, + { + "epoch": 1.82, + "eval_loss": 1.1513153314590454, + "eval_runtime": 516.4265, + "eval_samples_per_second": 14.792, + "eval_wer": 0.39315017581977757, + "step": 12320 + }, + { + "epoch": 1.83, + "learning_rate": 9.120178041543027e-06, + "loss": 1.2694, + "step": 12360 + }, + { + "epoch": 1.83, + "eval_loss": 1.2082685232162476, + "eval_runtime": 514.6625, + "eval_samples_per_second": 14.843, + "eval_wer": 0.39806741187569683, + "step": 12360 + }, + { + "epoch": 1.83, + "learning_rate": 9.117210682492583e-06, + "loss": 1.2862, + "step": 12400 + }, + { + "epoch": 1.83, + "eval_loss": 1.1853402853012085, + "eval_runtime": 514.4975, + "eval_samples_per_second": 14.847, + "eval_wer": 0.3966379827896738, + "step": 12400 + }, + { + "epoch": 1.84, + "learning_rate": 9.114243323442137e-06, + "loss": 1.2195, + "step": 12440 + }, + { + "epoch": 1.84, + "eval_loss": 1.2082812786102295, + "eval_runtime": 514.1893, + "eval_samples_per_second": 14.856, + "eval_wer": 0.39843906343806285, + "step": 12440 + }, + { + "epoch": 1.84, + "learning_rate": 9.111275964391693e-06, + "loss": 1.2743, + "step": 12480 + }, + { + "epoch": 1.84, + "eval_loss": 1.175351619720459, + "eval_runtime": 518.3681, + "eval_samples_per_second": 14.737, + "eval_wer": 0.3966379827896738, + "step": 12480 + }, + { + "epoch": 1.85, + "learning_rate": 9.108308605341248e-06, + "loss": 1.1761, + "step": 12520 + }, + { + "epoch": 1.85, + "eval_loss": 1.233346700668335, + "eval_runtime": 514.5119, + "eval_samples_per_second": 14.847, + "eval_wer": 0.4001543783412905, + "step": 12520 + }, + { + "epoch": 1.86, + "learning_rate": 9.105341246290802e-06, + "loss": 1.2218, + "step": 12560 + }, + { + "epoch": 1.86, + "eval_loss": 1.237270712852478, + "eval_runtime": 514.5013, + "eval_samples_per_second": 14.847, + "eval_wer": 0.4006689728122588, + "step": 12560 + }, + { + "epoch": 1.86, + "learning_rate": 9.102373887240357e-06, + "loss": 1.2488, + "step": 12600 + }, + { + "epoch": 1.86, + "eval_loss": 1.1729488372802734, + "eval_runtime": 515.1424, + "eval_samples_per_second": 14.829, + "eval_wer": 0.39435089625203695, + "step": 12600 + }, + { + "epoch": 1.87, + "learning_rate": 9.099406528189911e-06, + "loss": 1.2397, + "step": 12640 + }, + { + "epoch": 1.87, + "eval_loss": 1.1414551734924316, + "eval_runtime": 515.7448, + "eval_samples_per_second": 14.812, + "eval_wer": 0.39069155779181797, + "step": 12640 + }, + { + "epoch": 1.87, + "learning_rate": 9.096439169139467e-06, + "loss": 1.2579, + "step": 12680 + }, + { + "epoch": 1.87, + "eval_loss": 1.2156543731689453, + "eval_runtime": 514.923, + "eval_samples_per_second": 14.835, + "eval_wer": 0.3973526973326853, + "step": 12680 + }, + { + "epoch": 1.88, + "learning_rate": 9.093471810089022e-06, + "loss": 1.2884, + "step": 12720 + }, + { + "epoch": 1.88, + "eval_loss": 1.2026344537734985, + "eval_runtime": 516.6667, + "eval_samples_per_second": 14.785, + "eval_wer": 0.39675233711655566, + "step": 12720 + }, + { + "epoch": 1.89, + "learning_rate": 9.090504451038576e-06, + "loss": 1.2407, + "step": 12760 + }, + { + "epoch": 1.89, + "eval_loss": 1.2206709384918213, + "eval_runtime": 513.8178, + "eval_samples_per_second": 14.867, + "eval_wer": 0.39783870322193315, + "step": 12760 + }, + { + "epoch": 1.89, + "learning_rate": 9.08753709198813e-06, + "loss": 1.2793, + "step": 12800 + }, + { + "epoch": 1.89, + "eval_loss": 1.1325563192367554, + "eval_runtime": 515.4127, + "eval_samples_per_second": 14.821, + "eval_wer": 0.39200663255095913, + "step": 12800 + }, + { + "epoch": 1.9, + "learning_rate": 9.084569732937685e-06, + "loss": 1.2156, + "step": 12840 + }, + { + "epoch": 1.9, + "eval_loss": 1.1944189071655273, + "eval_runtime": 515.699, + "eval_samples_per_second": 14.813, + "eval_wer": 0.39538008519397355, + "step": 12840 + }, + { + "epoch": 1.9, + "learning_rate": 9.081602373887241e-06, + "loss": 1.233, + "step": 12880 + }, + { + "epoch": 1.9, + "eval_loss": 1.1567288637161255, + "eval_runtime": 519.3504, + "eval_samples_per_second": 14.709, + "eval_wer": 0.3923496955316047, + "step": 12880 + }, + { + "epoch": 1.91, + "learning_rate": 9.078635014836796e-06, + "loss": 1.2187, + "step": 12920 + }, + { + "epoch": 1.91, + "eval_loss": 1.2292488813400269, + "eval_runtime": 514.3211, + "eval_samples_per_second": 14.853, + "eval_wer": 0.3977243488950513, + "step": 12920 + }, + { + "epoch": 1.92, + "learning_rate": 9.075667655786352e-06, + "loss": 1.2503, + "step": 12960 + }, + { + "epoch": 1.92, + "eval_loss": 1.1655694246292114, + "eval_runtime": 514.7204, + "eval_samples_per_second": 14.841, + "eval_wer": 0.3933502958918208, + "step": 12960 + }, + { + "epoch": 1.92, + "learning_rate": 9.072700296735906e-06, + "loss": 1.2253, + "step": 13000 + }, + { + "epoch": 1.92, + "eval_loss": 1.1394695043563843, + "eval_runtime": 519.5022, + "eval_samples_per_second": 14.704, + "eval_wer": 0.3910917979359044, + "step": 13000 + }, + { + "epoch": 1.93, + "learning_rate": 9.06973293768546e-06, + "loss": 1.277, + "step": 13040 + }, + { + "epoch": 1.93, + "eval_loss": 1.178635597229004, + "eval_runtime": 515.4564, + "eval_samples_per_second": 14.82, + "eval_wer": 0.3931215872380571, + "step": 13040 + }, + { + "epoch": 1.93, + "learning_rate": 9.066765578635015e-06, + "loss": 1.2246, + "step": 13080 + }, + { + "epoch": 1.93, + "eval_loss": 1.166589379310608, + "eval_runtime": 514.81, + "eval_samples_per_second": 14.838, + "eval_wer": 0.3924068726950456, + "step": 13080 + }, + { + "epoch": 1.94, + "learning_rate": 9.063798219584571e-06, + "loss": 1.3, + "step": 13120 + }, + { + "epoch": 1.94, + "eval_loss": 1.1885249614715576, + "eval_runtime": 515.2189, + "eval_samples_per_second": 14.827, + "eval_wer": 0.3940364218531119, + "step": 13120 + }, + { + "epoch": 1.95, + "learning_rate": 9.060830860534126e-06, + "loss": 1.1914, + "step": 13160 + }, + { + "epoch": 1.95, + "eval_loss": 1.2117103338241577, + "eval_runtime": 515.423, + "eval_samples_per_second": 14.821, + "eval_wer": 0.3964950398810715, + "step": 13160 + }, + { + "epoch": 1.95, + "learning_rate": 9.05786350148368e-06, + "loss": 1.2394, + "step": 13200 + }, + { + "epoch": 1.95, + "eval_loss": 1.168739914894104, + "eval_runtime": 516.4092, + "eval_samples_per_second": 14.793, + "eval_wer": 0.39406501043483233, + "step": 13200 + }, + { + "epoch": 1.96, + "learning_rate": 9.054896142433235e-06, + "loss": 1.2302, + "step": 13240 + }, + { + "epoch": 1.96, + "eval_loss": 1.2200406789779663, + "eval_runtime": 516.295, + "eval_samples_per_second": 14.796, + "eval_wer": 0.3980388232939764, + "step": 13240 + }, + { + "epoch": 1.96, + "learning_rate": 9.051928783382789e-06, + "loss": 1.2483, + "step": 13280 + }, + { + "epoch": 1.96, + "eval_loss": 1.1558986902236938, + "eval_runtime": 516.1105, + "eval_samples_per_second": 14.801, + "eval_wer": 0.39297864432945484, + "step": 13280 + }, + { + "epoch": 1.97, + "learning_rate": 9.048961424332345e-06, + "loss": 1.2716, + "step": 13320 + }, + { + "epoch": 1.97, + "eval_loss": 1.2075449228286743, + "eval_runtime": 514.9105, + "eval_samples_per_second": 14.836, + "eval_wer": 0.39792446896709455, + "step": 13320 + }, + { + "epoch": 1.97, + "learning_rate": 9.0459940652819e-06, + "loss": 1.2013, + "step": 13360 + }, + { + "epoch": 1.97, + "eval_loss": 1.2613040208816528, + "eval_runtime": 515.4434, + "eval_samples_per_second": 14.82, + "eval_wer": 0.4017553389176363, + "step": 13360 + }, + { + "epoch": 1.98, + "learning_rate": 9.043026706231454e-06, + "loss": 1.2439, + "step": 13400 + }, + { + "epoch": 1.98, + "eval_loss": 1.2378604412078857, + "eval_runtime": 517.4479, + "eval_samples_per_second": 14.763, + "eval_wer": 0.4002973212498928, + "step": 13400 + }, + { + "epoch": 1.99, + "learning_rate": 9.04005934718101e-06, + "loss": 1.302, + "step": 13440 + }, + { + "epoch": 1.99, + "eval_loss": 1.1117513179779053, + "eval_runtime": 514.4198, + "eval_samples_per_second": 14.85, + "eval_wer": 0.38886188856170845, + "step": 13440 + }, + { + "epoch": 1.99, + "learning_rate": 9.037091988130565e-06, + "loss": 1.2044, + "step": 13480 + }, + { + "epoch": 1.99, + "eval_loss": 1.1643050909042358, + "eval_runtime": 514.7147, + "eval_samples_per_second": 14.841, + "eval_wer": 0.39172074673375457, + "step": 13480 + }, + { + "epoch": 2.0, + "learning_rate": 9.034124629080119e-06, + "loss": 1.2368, + "step": 13520 + }, + { + "epoch": 2.0, + "eval_loss": 1.1926770210266113, + "eval_runtime": 514.804, + "eval_samples_per_second": 14.839, + "eval_wer": 0.3945224277423597, + "step": 13520 + }, + { + "epoch": 2.0, + "learning_rate": 9.031157270029675e-06, + "loss": 1.2034, + "step": 13560 + }, + { + "epoch": 2.0, + "eval_loss": 1.2277581691741943, + "eval_runtime": 511.5394, + "eval_samples_per_second": 14.933, + "eval_wer": 0.39732410875096486, + "step": 13560 + }, + { + "epoch": 2.01, + "learning_rate": 9.02818991097923e-06, + "loss": 1.3293, + "step": 13600 + }, + { + "epoch": 2.01, + "eval_loss": 1.1324790716171265, + "eval_runtime": 512.754, + "eval_samples_per_second": 14.898, + "eval_wer": 0.3902913176477315, + "step": 13600 + }, + { + "epoch": 2.02, + "learning_rate": 9.025222551928784e-06, + "loss": 1.2176, + "step": 13640 + }, + { + "epoch": 2.02, + "eval_loss": 1.1624653339385986, + "eval_runtime": 512.412, + "eval_samples_per_second": 14.908, + "eval_wer": 0.3930072329111753, + "step": 13640 + }, + { + "epoch": 2.02, + "learning_rate": 9.022255192878339e-06, + "loss": 1.1786, + "step": 13680 + }, + { + "epoch": 2.02, + "eval_loss": 1.1658124923706055, + "eval_runtime": 514.2146, + "eval_samples_per_second": 14.856, + "eval_wer": 0.3932645301466594, + "step": 13680 + }, + { + "epoch": 2.03, + "learning_rate": 9.019287833827895e-06, + "loss": 1.2508, + "step": 13720 + }, + { + "epoch": 2.03, + "eval_loss": 1.222221851348877, + "eval_runtime": 514.3863, + "eval_samples_per_second": 14.851, + "eval_wer": 0.39755281740472853, + "step": 13720 + }, + { + "epoch": 2.03, + "learning_rate": 9.016320474777449e-06, + "loss": 1.2972, + "step": 13760 + }, + { + "epoch": 2.03, + "eval_loss": 1.1103342771530151, + "eval_runtime": 514.9599, + "eval_samples_per_second": 14.834, + "eval_wer": 0.3885474141627834, + "step": 13760 + }, + { + "epoch": 2.04, + "learning_rate": 9.013353115727004e-06, + "loss": 1.2627, + "step": 13800 + }, + { + "epoch": 2.04, + "eval_loss": 1.2215102910995483, + "eval_runtime": 513.1472, + "eval_samples_per_second": 14.887, + "eval_wer": 0.39672374853483516, + "step": 13800 + }, + { + "epoch": 2.05, + "learning_rate": 9.010385756676558e-06, + "loss": 1.2212, + "step": 13840 + }, + { + "epoch": 2.05, + "eval_loss": 1.1900132894515991, + "eval_runtime": 518.6245, + "eval_samples_per_second": 14.729, + "eval_wer": 0.3942079533434346, + "step": 13840 + }, + { + "epoch": 2.05, + "learning_rate": 9.007418397626112e-06, + "loss": 1.1978, + "step": 13880 + }, + { + "epoch": 2.05, + "eval_loss": 1.216287612915039, + "eval_runtime": 513.2097, + "eval_samples_per_second": 14.885, + "eval_wer": 0.3952371422853712, + "step": 13880 + }, + { + "epoch": 2.06, + "learning_rate": 9.004451038575669e-06, + "loss": 1.2258, + "step": 13920 + }, + { + "epoch": 2.06, + "eval_loss": 1.2070460319519043, + "eval_runtime": 514.4057, + "eval_samples_per_second": 14.85, + "eval_wer": 0.3945510163240802, + "step": 13920 + }, + { + "epoch": 2.06, + "learning_rate": 9.001483679525223e-06, + "loss": 1.32, + "step": 13960 + }, + { + "epoch": 2.06, + "eval_loss": 1.1560930013656616, + "eval_runtime": 515.8608, + "eval_samples_per_second": 14.808, + "eval_wer": 0.3900911975756883, + "step": 13960 + }, + { + "epoch": 2.07, + "learning_rate": 8.998516320474779e-06, + "loss": 1.1321, + "step": 14000 + }, + { + "epoch": 2.07, + "eval_loss": 1.2391009330749512, + "eval_runtime": 512.8727, + "eval_samples_per_second": 14.895, + "eval_wer": 0.39723834300580346, + "step": 14000 + }, + { + "epoch": 2.08, + "learning_rate": 8.995548961424334e-06, + "loss": 1.1845, + "step": 14040 + }, + { + "epoch": 2.08, + "eval_loss": 1.2508766651153564, + "eval_runtime": 512.8212, + "eval_samples_per_second": 14.896, + "eval_wer": 0.39821035478429917, + "step": 14040 + }, + { + "epoch": 2.08, + "learning_rate": 8.992581602373888e-06, + "loss": 1.2097, + "step": 14080 + }, + { + "epoch": 2.08, + "eval_loss": 1.2427051067352295, + "eval_runtime": 516.0232, + "eval_samples_per_second": 14.804, + "eval_wer": 0.3984676520197833, + "step": 14080 + }, + { + "epoch": 2.09, + "learning_rate": 8.989614243323442e-06, + "loss": 1.2673, + "step": 14120 + }, + { + "epoch": 2.09, + "eval_loss": 1.265183925628662, + "eval_runtime": 513.1316, + "eval_samples_per_second": 14.887, + "eval_wer": 0.4006689728122588, + "step": 14120 + }, + { + "epoch": 2.09, + "learning_rate": 8.986646884272999e-06, + "loss": 1.1522, + "step": 14160 + }, + { + "epoch": 2.09, + "eval_loss": 1.2947725057601929, + "eval_runtime": 514.3237, + "eval_samples_per_second": 14.853, + "eval_wer": 0.40289888218645475, + "step": 14160 + }, + { + "epoch": 2.1, + "learning_rate": 8.983679525222553e-06, + "loss": 1.1791, + "step": 14200 + }, + { + "epoch": 2.1, + "eval_loss": 1.215259313583374, + "eval_runtime": 517.3217, + "eval_samples_per_second": 14.766, + "eval_wer": 0.39526573086709166, + "step": 14200 + }, + { + "epoch": 2.1, + "learning_rate": 8.980712166172107e-06, + "loss": 1.1987, + "step": 14240 + }, + { + "epoch": 2.1, + "eval_loss": 1.2145788669586182, + "eval_runtime": 513.6121, + "eval_samples_per_second": 14.873, + "eval_wer": 0.39477972497784386, + "step": 14240 + }, + { + "epoch": 2.11, + "learning_rate": 8.977744807121662e-06, + "loss": 1.1898, + "step": 14280 + }, + { + "epoch": 2.11, + "eval_loss": 1.248544692993164, + "eval_runtime": 514.2304, + "eval_samples_per_second": 14.855, + "eval_wer": 0.39852482918322424, + "step": 14280 + }, + { + "epoch": 2.12, + "learning_rate": 8.974777448071216e-06, + "loss": 1.1876, + "step": 14320 + }, + { + "epoch": 2.12, + "eval_loss": 1.1694121360778809, + "eval_runtime": 513.0559, + "eval_samples_per_second": 14.889, + "eval_wer": 0.3925784041853684, + "step": 14320 + }, + { + "epoch": 2.12, + "learning_rate": 8.971810089020773e-06, + "loss": 1.2031, + "step": 14360 + }, + { + "epoch": 2.12, + "eval_loss": 1.2123262882232666, + "eval_runtime": 513.0034, + "eval_samples_per_second": 14.891, + "eval_wer": 0.3949512564681666, + "step": 14360 + }, + { + "epoch": 2.13, + "learning_rate": 8.968842729970327e-06, + "loss": 1.3011, + "step": 14400 + }, + { + "epoch": 2.13, + "eval_loss": 1.1513561010360718, + "eval_runtime": 513.6034, + "eval_samples_per_second": 14.873, + "eval_wer": 0.3908059121186998, + "step": 14400 + }, + { + "epoch": 2.13, + "learning_rate": 8.965875370919881e-06, + "loss": 1.2273, + "step": 14440 + }, + { + "epoch": 2.13, + "eval_loss": 1.1705405712127686, + "eval_runtime": 516.8255, + "eval_samples_per_second": 14.781, + "eval_wer": 0.3915778038251522, + "step": 14440 + }, + { + "epoch": 2.14, + "learning_rate": 8.962908011869438e-06, + "loss": 1.2064, + "step": 14480 + }, + { + "epoch": 2.14, + "eval_loss": 1.1850563287734985, + "eval_runtime": 513.2674, + "eval_samples_per_second": 14.883, + "eval_wer": 0.3918065124789159, + "step": 14480 + }, + { + "epoch": 2.15, + "learning_rate": 8.959940652818992e-06, + "loss": 1.204, + "step": 14520 + }, + { + "epoch": 2.15, + "eval_loss": 1.2443561553955078, + "eval_runtime": 512.4476, + "eval_samples_per_second": 14.907, + "eval_wer": 0.39718116584236257, + "step": 14520 + }, + { + "epoch": 2.15, + "learning_rate": 8.956973293768546e-06, + "loss": 1.2153, + "step": 14560 + }, + { + "epoch": 2.15, + "eval_loss": 1.1515636444091797, + "eval_runtime": 516.4564, + "eval_samples_per_second": 14.791, + "eval_wer": 0.3897767231767632, + "step": 14560 + }, + { + "epoch": 2.16, + "learning_rate": 8.954005934718103e-06, + "loss": 1.2881, + "step": 14600 + }, + { + "epoch": 2.16, + "eval_loss": 1.1857043504714966, + "eval_runtime": 513.9778, + "eval_samples_per_second": 14.863, + "eval_wer": 0.3926069927670888, + "step": 14600 + }, + { + "epoch": 2.16, + "learning_rate": 8.951038575667657e-06, + "loss": 1.186, + "step": 14640 + }, + { + "epoch": 2.16, + "eval_loss": 1.1939418315887451, + "eval_runtime": 515.0056, + "eval_samples_per_second": 14.833, + "eval_wer": 0.39303582149289573, + "step": 14640 + }, + { + "epoch": 2.17, + "learning_rate": 8.948071216617211e-06, + "loss": 1.1952, + "step": 14680 + }, + { + "epoch": 2.17, + "eval_loss": 1.1353286504745483, + "eval_runtime": 514.5552, + "eval_samples_per_second": 14.846, + "eval_wer": 0.3884902369993425, + "step": 14680 + }, + { + "epoch": 2.18, + "learning_rate": 8.945103857566766e-06, + "loss": 1.2119, + "step": 14720 + }, + { + "epoch": 2.18, + "eval_loss": 1.2173880338668823, + "eval_runtime": 517.3615, + "eval_samples_per_second": 14.765, + "eval_wer": 0.39397924468967094, + "step": 14720 + }, + { + "epoch": 2.18, + "learning_rate": 8.942136498516322e-06, + "loss": 1.1097, + "step": 14760 + }, + { + "epoch": 2.18, + "eval_loss": 1.237266182899475, + "eval_runtime": 517.2333, + "eval_samples_per_second": 14.769, + "eval_wer": 0.3950656107950485, + "step": 14760 + }, + { + "epoch": 2.19, + "learning_rate": 8.939169139465876e-06, + "loss": 1.1622, + "step": 14800 + }, + { + "epoch": 2.19, + "eval_loss": 1.2398948669433594, + "eval_runtime": 515.4061, + "eval_samples_per_second": 14.821, + "eval_wer": 0.39500843363160754, + "step": 14800 + }, + { + "epoch": 2.19, + "learning_rate": 8.936201780415431e-06, + "loss": 1.1339, + "step": 14840 + }, + { + "epoch": 2.19, + "eval_loss": 1.2222470045089722, + "eval_runtime": 514.7182, + "eval_samples_per_second": 14.841, + "eval_wer": 0.3927499356756911, + "step": 14840 + }, + { + "epoch": 2.2, + "learning_rate": 8.933234421364985e-06, + "loss": 1.1469, + "step": 14880 + }, + { + "epoch": 2.2, + "eval_loss": 1.2348510026931763, + "eval_runtime": 515.4744, + "eval_samples_per_second": 14.819, + "eval_wer": 0.39375053603590726, + "step": 14880 + }, + { + "epoch": 2.21, + "learning_rate": 8.93026706231454e-06, + "loss": 1.222, + "step": 14920 + }, + { + "epoch": 2.21, + "eval_loss": 1.166113018989563, + "eval_runtime": 513.7354, + "eval_samples_per_second": 14.87, + "eval_wer": 0.3882329397638583, + "step": 14920 + }, + { + "epoch": 2.21, + "learning_rate": 8.927299703264096e-06, + "loss": 1.2914, + "step": 14960 + }, + { + "epoch": 2.21, + "eval_loss": 1.1017524003982544, + "eval_runtime": 513.5751, + "eval_samples_per_second": 14.874, + "eval_wer": 0.3823436919294434, + "step": 14960 + }, + { + "epoch": 2.22, + "learning_rate": 8.92433234421365e-06, + "loss": 1.1736, + "step": 15000 + }, + { + "epoch": 2.22, + "eval_loss": 1.204420566558838, + "eval_runtime": 513.4936, + "eval_samples_per_second": 14.877, + "eval_wer": 0.38946224877783814, + "step": 15000 + }, + { + "epoch": 2.22, + "learning_rate": 8.921364985163205e-06, + "loss": 1.2127, + "step": 15040 + }, + { + "epoch": 2.22, + "eval_loss": 1.1424169540405273, + "eval_runtime": 518.8689, + "eval_samples_per_second": 14.722, + "eval_wer": 0.3849738414477258, + "step": 15040 + }, + { + "epoch": 2.23, + "learning_rate": 8.918397626112761e-06, + "loss": 1.1745, + "step": 15080 + }, + { + "epoch": 2.23, + "eval_loss": 1.2061676979064941, + "eval_runtime": 514.6415, + "eval_samples_per_second": 14.843, + "eval_wer": 0.3894908373595586, + "step": 15080 + }, + { + "epoch": 2.24, + "learning_rate": 8.915430267062315e-06, + "loss": 1.2359, + "step": 15120 + }, + { + "epoch": 2.24, + "eval_loss": 1.16087007522583, + "eval_runtime": 514.5305, + "eval_samples_per_second": 14.847, + "eval_wer": 0.38640327053374884, + "step": 15120 + }, + { + "epoch": 2.24, + "learning_rate": 8.91246290801187e-06, + "loss": 1.2219, + "step": 15160 + }, + { + "epoch": 2.24, + "eval_loss": 1.1447373628616333, + "eval_runtime": 519.9867, + "eval_samples_per_second": 14.691, + "eval_wer": 0.38494525286600534, + "step": 15160 + }, + { + "epoch": 2.25, + "learning_rate": 8.909495548961426e-06, + "loss": 1.2052, + "step": 15200 + }, + { + "epoch": 2.25, + "eval_loss": 1.1689306497573853, + "eval_runtime": 514.0595, + "eval_samples_per_second": 14.86, + "eval_wer": 0.3872037508219217, + "step": 15200 + }, + { + "epoch": 2.25, + "learning_rate": 8.90652818991098e-06, + "loss": 1.2245, + "step": 15240 + }, + { + "epoch": 2.25, + "eval_loss": 1.1655718088150024, + "eval_runtime": 516.0181, + "eval_samples_per_second": 14.804, + "eval_wer": 0.38786128820149235, + "step": 15240 + }, + { + "epoch": 2.26, + "learning_rate": 8.903560830860535e-06, + "loss": 1.2552, + "step": 15280 + }, + { + "epoch": 2.26, + "eval_loss": 1.1559613943099976, + "eval_runtime": 515.8973, + "eval_samples_per_second": 14.807, + "eval_wer": 0.3873752823122445, + "step": 15280 + }, + { + "epoch": 2.26, + "learning_rate": 8.90059347181009e-06, + "loss": 1.2728, + "step": 15320 + }, + { + "epoch": 2.26, + "eval_loss": 1.1153063774108887, + "eval_runtime": 514.4347, + "eval_samples_per_second": 14.849, + "eval_wer": 0.38374453243374596, + "step": 15320 + }, + { + "epoch": 2.27, + "learning_rate": 8.897626112759644e-06, + "loss": 1.2461, + "step": 15360 + }, + { + "epoch": 2.27, + "eval_loss": 1.1778333187103271, + "eval_runtime": 513.397, + "eval_samples_per_second": 14.879, + "eval_wer": 0.3889762428885903, + "step": 15360 + }, + { + "epoch": 2.28, + "learning_rate": 8.8946587537092e-06, + "loss": 1.2111, + "step": 15400 + }, + { + "epoch": 2.28, + "eval_loss": 1.178096055984497, + "eval_runtime": 515.5018, + "eval_samples_per_second": 14.819, + "eval_wer": 0.39014837473912917, + "step": 15400 + }, + { + "epoch": 2.28, + "learning_rate": 8.891691394658754e-06, + "loss": 1.2413, + "step": 15440 + }, + { + "epoch": 2.28, + "eval_loss": 1.1333427429199219, + "eval_runtime": 513.8433, + "eval_samples_per_second": 14.866, + "eval_wer": 0.3861173847165442, + "step": 15440 + }, + { + "epoch": 2.29, + "learning_rate": 8.888724035608309e-06, + "loss": 1.1375, + "step": 15480 + }, + { + "epoch": 2.29, + "eval_loss": 1.201409101486206, + "eval_runtime": 513.2721, + "eval_samples_per_second": 14.883, + "eval_wer": 0.39003402041224733, + "step": 15480 + }, + { + "epoch": 2.29, + "learning_rate": 8.885756676557863e-06, + "loss": 1.2674, + "step": 15520 + }, + { + "epoch": 2.29, + "eval_loss": 1.1463115215301514, + "eval_runtime": 514.5134, + "eval_samples_per_second": 14.847, + "eval_wer": 0.38586008748106004, + "step": 15520 + }, + { + "epoch": 2.3, + "learning_rate": 8.88278931750742e-06, + "loss": 1.2618, + "step": 15560 + }, + { + "epoch": 2.3, + "eval_loss": 1.1397802829742432, + "eval_runtime": 517.4103, + "eval_samples_per_second": 14.764, + "eval_wer": 0.38534549301009174, + "step": 15560 + }, + { + "epoch": 2.31, + "learning_rate": 8.879821958456974e-06, + "loss": 1.1792, + "step": 15600 + }, + { + "epoch": 2.31, + "eval_loss": 1.1419965028762817, + "eval_runtime": 515.2357, + "eval_samples_per_second": 14.826, + "eval_wer": 0.3848308985391235, + "step": 15600 + }, + { + "epoch": 2.31, + "learning_rate": 8.87685459940653e-06, + "loss": 1.1582, + "step": 15640 + }, + { + "epoch": 2.31, + "eval_loss": 1.1558929681777954, + "eval_runtime": 514.8951, + "eval_samples_per_second": 14.836, + "eval_wer": 0.3852311386832099, + "step": 15640 + }, + { + "epoch": 2.32, + "learning_rate": 8.873887240356084e-06, + "loss": 1.1773, + "step": 15680 + }, + { + "epoch": 2.32, + "eval_loss": 1.1893229484558105, + "eval_runtime": 514.0693, + "eval_samples_per_second": 14.86, + "eval_wer": 0.3893478944509563, + "step": 15680 + }, + { + "epoch": 2.32, + "learning_rate": 8.870919881305639e-06, + "loss": 1.0788, + "step": 15720 + }, + { + "epoch": 2.32, + "eval_loss": 1.1800158023834229, + "eval_runtime": 515.5535, + "eval_samples_per_second": 14.817, + "eval_wer": 0.38760399096600817, + "step": 15720 + }, + { + "epoch": 2.33, + "learning_rate": 8.867952522255193e-06, + "loss": 1.1262, + "step": 15760 + }, + { + "epoch": 2.33, + "eval_loss": 1.1686158180236816, + "eval_runtime": 515.9798, + "eval_samples_per_second": 14.805, + "eval_wer": 0.38777552245633096, + "step": 15760 + }, + { + "epoch": 2.34, + "learning_rate": 8.86498516320475e-06, + "loss": 1.2084, + "step": 15800 + }, + { + "epoch": 2.34, + "eval_loss": 1.0843065977096558, + "eval_runtime": 514.0643, + "eval_samples_per_second": 14.86, + "eval_wer": 0.3800280168100861, + "step": 15800 + }, + { + "epoch": 2.34, + "learning_rate": 8.862017804154304e-06, + "loss": 1.2121, + "step": 15840 + }, + { + "epoch": 2.34, + "eval_loss": 1.1317861080169678, + "eval_runtime": 514.4059, + "eval_samples_per_second": 14.85, + "eval_wer": 0.3843163040681552, + "step": 15840 + }, + { + "epoch": 2.35, + "learning_rate": 8.859050445103858e-06, + "loss": 1.1509, + "step": 15880 + }, + { + "epoch": 2.35, + "eval_loss": 1.1995600461959839, + "eval_runtime": 514.1483, + "eval_samples_per_second": 14.858, + "eval_wer": 0.39003402041224733, + "step": 15880 + }, + { + "epoch": 2.35, + "learning_rate": 8.856083086053413e-06, + "loss": 1.2393, + "step": 15920 + }, + { + "epoch": 2.35, + "eval_loss": 1.1386741399765015, + "eval_runtime": 514.09, + "eval_samples_per_second": 14.859, + "eval_wer": 0.38440206981331654, + "step": 15920 + }, + { + "epoch": 2.36, + "learning_rate": 8.853115727002967e-06, + "loss": 1.2539, + "step": 15960 + }, + { + "epoch": 2.36, + "eval_loss": 1.1492124795913696, + "eval_runtime": 514.4977, + "eval_samples_per_second": 14.847, + "eval_wer": 0.38623173904342606, + "step": 15960 + }, + { + "epoch": 2.37, + "learning_rate": 8.850148367952523e-06, + "loss": 1.2283, + "step": 16000 + }, + { + "epoch": 2.37, + "eval_loss": 1.099195957183838, + "eval_runtime": 513.9509, + "eval_samples_per_second": 14.863, + "eval_wer": 0.3825438120014866, + "step": 16000 + }, + { + "epoch": 2.37, + "learning_rate": 8.847181008902078e-06, + "loss": 1.1774, + "step": 16040 + }, + { + "epoch": 2.37, + "eval_loss": 1.1555029153823853, + "eval_runtime": 514.946, + "eval_samples_per_second": 14.835, + "eval_wer": 0.3865748020240716, + "step": 16040 + }, + { + "epoch": 2.38, + "learning_rate": 8.844213649851632e-06, + "loss": 1.2068, + "step": 16080 + }, + { + "epoch": 2.38, + "eval_loss": 1.1306747198104858, + "eval_runtime": 513.7635, + "eval_samples_per_second": 14.869, + "eval_wer": 0.38400182966923013, + "step": 16080 + }, + { + "epoch": 2.38, + "learning_rate": 8.841246290801188e-06, + "loss": 1.1724, + "step": 16120 + }, + { + "epoch": 2.38, + "eval_loss": 1.1298811435699463, + "eval_runtime": 520.6639, + "eval_samples_per_second": 14.672, + "eval_wer": 0.3830584064724549, + "step": 16120 + }, + { + "epoch": 2.39, + "learning_rate": 8.838278931750743e-06, + "loss": 1.1736, + "step": 16160 + }, + { + "epoch": 2.39, + "eval_loss": 1.171027660369873, + "eval_runtime": 516.0891, + "eval_samples_per_second": 14.802, + "eval_wer": 0.3865176248606307, + "step": 16160 + }, + { + "epoch": 2.39, + "learning_rate": 8.835311572700297e-06, + "loss": 1.2153, + "step": 16200 + }, + { + "epoch": 2.39, + "eval_loss": 1.1371372938156128, + "eval_runtime": 515.9108, + "eval_samples_per_second": 14.807, + "eval_wer": 0.3843163040681552, + "step": 16200 + }, + { + "epoch": 2.4, + "learning_rate": 8.832344213649853e-06, + "loss": 1.1917, + "step": 16240 + }, + { + "epoch": 2.4, + "eval_loss": 1.1220273971557617, + "eval_runtime": 519.3713, + "eval_samples_per_second": 14.708, + "eval_wer": 0.382257926184282, + "step": 16240 + }, + { + "epoch": 2.41, + "learning_rate": 8.829376854599408e-06, + "loss": 1.2098, + "step": 16280 + }, + { + "epoch": 2.41, + "eval_loss": 1.124094843864441, + "eval_runtime": 515.6405, + "eval_samples_per_second": 14.815, + "eval_wer": 0.3820006289487978, + "step": 16280 + }, + { + "epoch": 2.41, + "learning_rate": 8.826409495548962e-06, + "loss": 1.1973, + "step": 16320 + }, + { + "epoch": 2.41, + "eval_loss": 1.1830039024353027, + "eval_runtime": 514.0734, + "eval_samples_per_second": 14.86, + "eval_wer": 0.3866033906057921, + "step": 16320 + }, + { + "epoch": 2.42, + "learning_rate": 8.823442136498517e-06, + "loss": 1.2254, + "step": 16360 + }, + { + "epoch": 2.42, + "eval_loss": 1.1085596084594727, + "eval_runtime": 518.9471, + "eval_samples_per_second": 14.72, + "eval_wer": 0.379713542411161, + "step": 16360 + }, + { + "epoch": 2.42, + "learning_rate": 8.820474777448071e-06, + "loss": 1.2464, + "step": 16400 + }, + { + "epoch": 2.42, + "eval_loss": 1.1189533472061157, + "eval_runtime": 514.8256, + "eval_samples_per_second": 14.838, + "eval_wer": 0.38111438291546357, + "step": 16400 + }, + { + "epoch": 2.43, + "learning_rate": 8.817507418397627e-06, + "loss": 1.2586, + "step": 16440 + }, + { + "epoch": 2.43, + "eval_loss": 1.1045169830322266, + "eval_runtime": 515.7923, + "eval_samples_per_second": 14.81, + "eval_wer": 0.3812287372423454, + "step": 16440 + }, + { + "epoch": 2.44, + "learning_rate": 8.814540059347182e-06, + "loss": 1.2458, + "step": 16480 + }, + { + "epoch": 2.44, + "eval_loss": 1.0960806608200073, + "eval_runtime": 516.0913, + "eval_samples_per_second": 14.802, + "eval_wer": 0.38039966837245204, + "step": 16480 + }, + { + "epoch": 2.44, + "learning_rate": 8.811572700296736e-06, + "loss": 1.159, + "step": 16520 + }, + { + "epoch": 2.44, + "eval_loss": 1.1752724647521973, + "eval_runtime": 516.7188, + "eval_samples_per_second": 14.784, + "eval_wer": 0.38666056776923297, + "step": 16520 + }, + { + "epoch": 2.45, + "learning_rate": 8.80860534124629e-06, + "loss": 1.1689, + "step": 16560 + }, + { + "epoch": 2.45, + "eval_loss": 1.1486188173294067, + "eval_runtime": 516.0173, + "eval_samples_per_second": 14.804, + "eval_wer": 0.38448783555847793, + "step": 16560 + }, + { + "epoch": 2.45, + "learning_rate": 8.805637982195847e-06, + "loss": 1.1315, + "step": 16600 + }, + { + "epoch": 2.45, + "eval_loss": 1.1468220949172974, + "eval_runtime": 519.4606, + "eval_samples_per_second": 14.706, + "eval_wer": 0.38485948712084395, + "step": 16600 + }, + { + "epoch": 2.46, + "learning_rate": 8.802670623145401e-06, + "loss": 1.25, + "step": 16640 + }, + { + "epoch": 2.46, + "eval_loss": 1.1769051551818848, + "eval_runtime": 516.7304, + "eval_samples_per_second": 14.783, + "eval_wer": 0.3864318591154693, + "step": 16640 + }, + { + "epoch": 2.47, + "learning_rate": 8.799703264094957e-06, + "loss": 1.1341, + "step": 16680 + }, + { + "epoch": 2.47, + "eval_loss": 1.2113075256347656, + "eval_runtime": 516.1179, + "eval_samples_per_second": 14.801, + "eval_wer": 0.3884044712541811, + "step": 16680 + }, + { + "epoch": 2.47, + "learning_rate": 8.796735905044512e-06, + "loss": 1.2025, + "step": 16720 + }, + { + "epoch": 2.47, + "eval_loss": 1.1068987846374512, + "eval_runtime": 517.3405, + "eval_samples_per_second": 14.766, + "eval_wer": 0.37945624517567683, + "step": 16720 + }, + { + "epoch": 2.48, + "learning_rate": 8.793768545994066e-06, + "loss": 1.2243, + "step": 16760 + }, + { + "epoch": 2.48, + "eval_loss": 1.1009721755981445, + "eval_runtime": 516.8269, + "eval_samples_per_second": 14.781, + "eval_wer": 0.37914177077675176, + "step": 16760 + }, + { + "epoch": 2.48, + "learning_rate": 8.79080118694362e-06, + "loss": 1.2169, + "step": 16800 + }, + { + "epoch": 2.48, + "eval_loss": 1.13065505027771, + "eval_runtime": 516.3526, + "eval_samples_per_second": 14.794, + "eval_wer": 0.3832585265444981, + "step": 16800 + }, + { + "epoch": 2.49, + "learning_rate": 8.787833827893177e-06, + "loss": 1.149, + "step": 16840 + }, + { + "epoch": 2.49, + "eval_loss": 1.14747154712677, + "eval_runtime": 516.1495, + "eval_samples_per_second": 14.8, + "eval_wer": 0.3835158237799823, + "step": 16840 + }, + { + "epoch": 2.5, + "learning_rate": 8.784866468842731e-06, + "loss": 1.2755, + "step": 16880 + }, + { + "epoch": 2.5, + "eval_loss": 1.0690319538116455, + "eval_runtime": 515.8956, + "eval_samples_per_second": 14.807, + "eval_wer": 0.3782555247434175, + "step": 16880 + }, + { + "epoch": 2.5, + "learning_rate": 8.781899109792286e-06, + "loss": 1.1765, + "step": 16920 + }, + { + "epoch": 2.5, + "eval_loss": 1.1521514654159546, + "eval_runtime": 515.9101, + "eval_samples_per_second": 14.807, + "eval_wer": 0.385173961519769, + "step": 16920 + }, + { + "epoch": 2.51, + "learning_rate": 8.77893175074184e-06, + "loss": 1.2121, + "step": 16960 + }, + { + "epoch": 2.51, + "eval_loss": 1.1224206686019897, + "eval_runtime": 514.1763, + "eval_samples_per_second": 14.857, + "eval_wer": 0.3823436919294434, + "step": 16960 + }, + { + "epoch": 2.51, + "learning_rate": 8.775964391691394e-06, + "loss": 1.1043, + "step": 17000 + }, + { + "epoch": 2.51, + "eval_loss": 1.157297968864441, + "eval_runtime": 515.382, + "eval_samples_per_second": 14.822, + "eval_wer": 0.38337288087138, + "step": 17000 + }, + { + "epoch": 2.52, + "learning_rate": 8.77299703264095e-06, + "loss": 1.1288, + "step": 17040 + }, + { + "epoch": 2.52, + "eval_loss": 1.1980996131896973, + "eval_runtime": 515.1928, + "eval_samples_per_second": 14.827, + "eval_wer": 0.3865462134423511, + "step": 17040 + }, + { + "epoch": 2.52, + "learning_rate": 8.770029673590505e-06, + "loss": 1.1612, + "step": 17080 + }, + { + "epoch": 2.52, + "eval_loss": 1.158414363861084, + "eval_runtime": 517.5318, + "eval_samples_per_second": 14.76, + "eval_wer": 0.3832013493810572, + "step": 17080 + }, + { + "epoch": 2.53, + "learning_rate": 8.76706231454006e-06, + "loss": 1.1713, + "step": 17120 + }, + { + "epoch": 2.53, + "eval_loss": 1.1759231090545654, + "eval_runtime": 516.3896, + "eval_samples_per_second": 14.793, + "eval_wer": 0.3848880757025644, + "step": 17120 + }, + { + "epoch": 2.54, + "learning_rate": 8.764094955489616e-06, + "loss": 1.1009, + "step": 17160 + }, + { + "epoch": 2.54, + "eval_loss": 1.1567894220352173, + "eval_runtime": 515.7588, + "eval_samples_per_second": 14.811, + "eval_wer": 0.3825152234197661, + "step": 17160 + }, + { + "epoch": 2.54, + "learning_rate": 8.76112759643917e-06, + "loss": 1.1933, + "step": 17200 + }, + { + "epoch": 2.54, + "eval_loss": 1.1462833881378174, + "eval_runtime": 515.7317, + "eval_samples_per_second": 14.812, + "eval_wer": 0.38308699505417537, + "step": 17200 + }, + { + "epoch": 2.55, + "learning_rate": 8.758160237388725e-06, + "loss": 1.1916, + "step": 17240 + }, + { + "epoch": 2.55, + "eval_loss": 1.1652922630310059, + "eval_runtime": 517.3946, + "eval_samples_per_second": 14.764, + "eval_wer": 0.38463077846708027, + "step": 17240 + }, + { + "epoch": 2.55, + "learning_rate": 8.75519287833828e-06, + "loss": 1.1473, + "step": 17280 + }, + { + "epoch": 2.55, + "eval_loss": 1.2009822130203247, + "eval_runtime": 517.4811, + "eval_samples_per_second": 14.762, + "eval_wer": 0.38826152834557875, + "step": 17280 + }, + { + "epoch": 2.56, + "learning_rate": 8.752225519287835e-06, + "loss": 1.1388, + "step": 17320 + }, + { + "epoch": 2.56, + "eval_loss": 1.16202974319458, + "eval_runtime": 516.5131, + "eval_samples_per_second": 14.79, + "eval_wer": 0.38463077846708027, + "step": 17320 + }, + { + "epoch": 2.57, + "learning_rate": 8.74925816023739e-06, + "loss": 1.1555, + "step": 17360 + }, + { + "epoch": 2.57, + "eval_loss": 1.1844778060913086, + "eval_runtime": 515.2162, + "eval_samples_per_second": 14.827, + "eval_wer": 0.38666056776923297, + "step": 17360 + }, + { + "epoch": 2.57, + "learning_rate": 8.746290801186944e-06, + "loss": 1.2388, + "step": 17400 + }, + { + "epoch": 2.57, + "eval_loss": 1.1465528011322021, + "eval_runtime": 516.9239, + "eval_samples_per_second": 14.778, + "eval_wer": 0.38297264072729353, + "step": 17400 + }, + { + "epoch": 2.58, + "learning_rate": 8.743323442136498e-06, + "loss": 1.2875, + "step": 17440 + }, + { + "epoch": 2.58, + "eval_loss": 1.1762466430664062, + "eval_runtime": 519.1698, + "eval_samples_per_second": 14.714, + "eval_wer": 0.3861745618799851, + "step": 17440 + }, + { + "epoch": 2.58, + "learning_rate": 8.740356083086055e-06, + "loss": 1.137, + "step": 17480 + }, + { + "epoch": 2.58, + "eval_loss": 1.1911572217941284, + "eval_runtime": 515.6366, + "eval_samples_per_second": 14.815, + "eval_wer": 0.3875754023842877, + "step": 17480 + }, + { + "epoch": 2.59, + "learning_rate": 8.737388724035609e-06, + "loss": 1.1515, + "step": 17520 + }, + { + "epoch": 2.59, + "eval_loss": 1.1504846811294556, + "eval_runtime": 517.0111, + "eval_samples_per_second": 14.775, + "eval_wer": 0.38388747534234824, + "step": 17520 + }, + { + "epoch": 2.6, + "learning_rate": 8.734421364985163e-06, + "loss": 1.2847, + "step": 17560 + }, + { + "epoch": 2.6, + "eval_loss": 1.1752811670303345, + "eval_runtime": 516.3273, + "eval_samples_per_second": 14.795, + "eval_wer": 0.3871179850767603, + "step": 17560 + }, + { + "epoch": 2.6, + "learning_rate": 8.731454005934718e-06, + "loss": 1.1622, + "step": 17600 + }, + { + "epoch": 2.6, + "eval_loss": 1.123414158821106, + "eval_runtime": 515.7539, + "eval_samples_per_second": 14.811, + "eval_wer": 0.38185768604019554, + "step": 17600 + }, + { + "epoch": 2.61, + "learning_rate": 8.728486646884274e-06, + "loss": 1.1508, + "step": 17640 + }, + { + "epoch": 2.61, + "eval_loss": 1.1775832176208496, + "eval_runtime": 516.9514, + "eval_samples_per_second": 14.777, + "eval_wer": 0.38683209925955575, + "step": 17640 + }, + { + "epoch": 2.61, + "learning_rate": 8.725519287833828e-06, + "loss": 1.0831, + "step": 17680 + }, + { + "epoch": 2.61, + "eval_loss": 1.2460119724273682, + "eval_runtime": 518.9921, + "eval_samples_per_second": 14.719, + "eval_wer": 0.3918351010606364, + "step": 17680 + }, + { + "epoch": 2.62, + "learning_rate": 8.722551928783383e-06, + "loss": 1.1615, + "step": 17720 + }, + { + "epoch": 2.62, + "eval_loss": 1.2202004194259644, + "eval_runtime": 515.6757, + "eval_samples_per_second": 14.814, + "eval_wer": 0.38783269961977185, + "step": 17720 + }, + { + "epoch": 2.63, + "learning_rate": 8.719584569732939e-06, + "loss": 1.1371, + "step": 17760 + }, + { + "epoch": 2.63, + "eval_loss": 1.1302050352096558, + "eval_runtime": 515.2488, + "eval_samples_per_second": 14.826, + "eval_wer": 0.37894165070470853, + "step": 17760 + }, + { + "epoch": 2.63, + "learning_rate": 8.716617210682493e-06, + "loss": 1.2133, + "step": 17800 + }, + { + "epoch": 2.63, + "eval_loss": 1.221242904663086, + "eval_runtime": 516.8966, + "eval_samples_per_second": 14.779, + "eval_wer": 0.388089996855256, + "step": 17800 + }, + { + "epoch": 2.64, + "learning_rate": 8.713649851632048e-06, + "loss": 1.1797, + "step": 17840 + }, + { + "epoch": 2.64, + "eval_loss": 1.133954644203186, + "eval_runtime": 514.9141, + "eval_samples_per_second": 14.835, + "eval_wer": 0.3806569656079362, + "step": 17840 + }, + { + "epoch": 2.64, + "learning_rate": 8.710682492581604e-06, + "loss": 1.2021, + "step": 17880 + }, + { + "epoch": 2.64, + "eval_loss": 1.2000679969787598, + "eval_runtime": 514.8853, + "eval_samples_per_second": 14.836, + "eval_wer": 0.3874610480574059, + "step": 17880 + }, + { + "epoch": 2.65, + "learning_rate": 8.707715133531159e-06, + "loss": 1.2414, + "step": 17920 + }, + { + "epoch": 2.65, + "eval_loss": 1.0796840190887451, + "eval_runtime": 515.6668, + "eval_samples_per_second": 14.814, + "eval_wer": 0.3755967866434146, + "step": 17920 + }, + { + "epoch": 2.65, + "learning_rate": 8.704747774480713e-06, + "loss": 1.1007, + "step": 17960 + }, + { + "epoch": 2.65, + "eval_loss": 1.134572148323059, + "eval_runtime": 514.8571, + "eval_samples_per_second": 14.837, + "eval_wer": 0.3796849538294405, + "step": 17960 + }, + { + "epoch": 2.66, + "learning_rate": 8.701780415430267e-06, + "loss": 1.1547, + "step": 18000 + }, + { + "epoch": 2.66, + "eval_loss": 1.1803171634674072, + "eval_runtime": 517.471, + "eval_samples_per_second": 14.762, + "eval_wer": 0.38360158952514367, + "step": 18000 + }, + { + "epoch": 2.67, + "learning_rate": 8.698813056379822e-06, + "loss": 1.177, + "step": 18040 + }, + { + "epoch": 2.67, + "eval_loss": 1.1421719789505005, + "eval_runtime": 516.2962, + "eval_samples_per_second": 14.796, + "eval_wer": 0.38128591440578635, + "step": 18040 + }, + { + "epoch": 2.67, + "learning_rate": 8.695845697329378e-06, + "loss": 1.1647, + "step": 18080 + }, + { + "epoch": 2.67, + "eval_loss": 1.1459816694259644, + "eval_runtime": 515.5688, + "eval_samples_per_second": 14.817, + "eval_wer": 0.38214357185740017, + "step": 18080 + }, + { + "epoch": 2.68, + "learning_rate": 8.692878338278932e-06, + "loss": 1.1651, + "step": 18120 + }, + { + "epoch": 2.68, + "eval_loss": 1.1298251152038574, + "eval_runtime": 514.6921, + "eval_samples_per_second": 14.842, + "eval_wer": 0.37965636524772006, + "step": 18120 + }, + { + "epoch": 2.68, + "learning_rate": 8.689910979228487e-06, + "loss": 1.2419, + "step": 18160 + }, + { + "epoch": 2.68, + "eval_loss": 1.1433261632919312, + "eval_runtime": 515.2221, + "eval_samples_per_second": 14.827, + "eval_wer": 0.38134309156922724, + "step": 18160 + }, + { + "epoch": 2.69, + "learning_rate": 8.686943620178043e-06, + "loss": 1.2426, + "step": 18200 + }, + { + "epoch": 2.69, + "eval_loss": 1.1591742038726807, + "eval_runtime": 513.8262, + "eval_samples_per_second": 14.867, + "eval_wer": 0.3825438120014866, + "step": 18200 + }, + { + "epoch": 2.7, + "learning_rate": 8.683976261127597e-06, + "loss": 1.1744, + "step": 18240 + }, + { + "epoch": 2.7, + "eval_loss": 1.1115648746490479, + "eval_runtime": 516.907, + "eval_samples_per_second": 14.778, + "eval_wer": 0.3781697589982561, + "step": 18240 + }, + { + "epoch": 2.7, + "learning_rate": 8.681008902077152e-06, + "loss": 1.1531, + "step": 18280 + }, + { + "epoch": 2.7, + "eval_loss": 1.1400363445281982, + "eval_runtime": 516.1373, + "eval_samples_per_second": 14.8, + "eval_wer": 0.38059978844449527, + "step": 18280 + }, + { + "epoch": 2.71, + "learning_rate": 8.678041543026708e-06, + "loss": 1.1431, + "step": 18320 + }, + { + "epoch": 2.71, + "eval_loss": 1.176941990852356, + "eval_runtime": 514.8294, + "eval_samples_per_second": 14.838, + "eval_wer": 0.3836301781068641, + "step": 18320 + }, + { + "epoch": 2.71, + "learning_rate": 8.675074183976262e-06, + "loss": 1.1406, + "step": 18360 + }, + { + "epoch": 2.71, + "eval_loss": 1.1419347524642944, + "eval_runtime": 515.3852, + "eval_samples_per_second": 14.822, + "eval_wer": 0.37982789673804285, + "step": 18360 + }, + { + "epoch": 2.72, + "learning_rate": 8.672106824925817e-06, + "loss": 1.2016, + "step": 18400 + }, + { + "epoch": 2.72, + "eval_loss": 1.1380963325500488, + "eval_runtime": 516.9084, + "eval_samples_per_second": 14.778, + "eval_wer": 0.37957059950255867, + "step": 18400 + }, + { + "epoch": 2.73, + "learning_rate": 8.669139465875371e-06, + "loss": 1.2381, + "step": 18440 + }, + { + "epoch": 2.73, + "eval_loss": 1.1630064249038696, + "eval_runtime": 514.5662, + "eval_samples_per_second": 14.846, + "eval_wer": 0.38177192029503415, + "step": 18440 + }, + { + "epoch": 2.73, + "learning_rate": 8.666172106824926e-06, + "loss": 1.0927, + "step": 18480 + }, + { + "epoch": 2.73, + "eval_loss": 1.1508713960647583, + "eval_runtime": 517.2426, + "eval_samples_per_second": 14.769, + "eval_wer": 0.379713542411161, + "step": 18480 + }, + { + "epoch": 2.74, + "learning_rate": 8.663204747774482e-06, + "loss": 1.18, + "step": 18520 + }, + { + "epoch": 2.74, + "eval_loss": 1.0874180793762207, + "eval_runtime": 515.8383, + "eval_samples_per_second": 14.809, + "eval_wer": 0.37519654649932815, + "step": 18520 + }, + { + "epoch": 2.74, + "learning_rate": 8.660237388724036e-06, + "loss": 1.1011, + "step": 18560 + }, + { + "epoch": 2.74, + "eval_loss": 1.22551429271698, + "eval_runtime": 515.8982, + "eval_samples_per_second": 14.807, + "eval_wer": 0.3865176248606307, + "step": 18560 + }, + { + "epoch": 2.75, + "learning_rate": 8.65727002967359e-06, + "loss": 1.1406, + "step": 18600 + }, + { + "epoch": 2.75, + "eval_loss": 1.1352531909942627, + "eval_runtime": 515.5557, + "eval_samples_per_second": 14.817, + "eval_wer": 0.37819834757997656, + "step": 18600 + }, + { + "epoch": 2.76, + "learning_rate": 8.654302670623145e-06, + "loss": 1.2046, + "step": 18640 + }, + { + "epoch": 2.76, + "eval_loss": 1.152807593345642, + "eval_runtime": 516.9363, + "eval_samples_per_second": 14.777, + "eval_wer": 0.3801137825552474, + "step": 18640 + }, + { + "epoch": 2.76, + "learning_rate": 8.651335311572701e-06, + "loss": 1.2021, + "step": 18680 + }, + { + "epoch": 2.76, + "eval_loss": 1.1246099472045898, + "eval_runtime": 516.087, + "eval_samples_per_second": 14.802, + "eval_wer": 0.377483633036965, + "step": 18680 + }, + { + "epoch": 2.77, + "learning_rate": 8.648367952522256e-06, + "loss": 1.2423, + "step": 18720 + }, + { + "epoch": 2.77, + "eval_loss": 1.1400781869888306, + "eval_runtime": 517.6704, + "eval_samples_per_second": 14.756, + "eval_wer": 0.3791131821950313, + "step": 18720 + }, + { + "epoch": 2.77, + "learning_rate": 8.64540059347181e-06, + "loss": 1.1445, + "step": 18760 + }, + { + "epoch": 2.77, + "eval_loss": 1.1320958137512207, + "eval_runtime": 516.6712, + "eval_samples_per_second": 14.785, + "eval_wer": 0.37879870779610625, + "step": 18760 + }, + { + "epoch": 2.78, + "learning_rate": 8.642433234421366e-06, + "loss": 1.1884, + "step": 18800 + }, + { + "epoch": 2.78, + "eval_loss": 1.0789518356323242, + "eval_runtime": 515.7106, + "eval_samples_per_second": 14.813, + "eval_wer": 0.3746533634466394, + "step": 18800 + }, + { + "epoch": 2.78, + "learning_rate": 8.63946587537092e-06, + "loss": 1.1928, + "step": 18840 + }, + { + "epoch": 2.78, + "eval_loss": 1.1202785968780518, + "eval_runtime": 516.8609, + "eval_samples_per_second": 14.78, + "eval_wer": 0.3781697589982561, + "step": 18840 + }, + { + "epoch": 2.79, + "learning_rate": 8.636498516320475e-06, + "loss": 1.297, + "step": 18880 + }, + { + "epoch": 2.79, + "eval_loss": 1.0720806121826172, + "eval_runtime": 517.5214, + "eval_samples_per_second": 14.761, + "eval_wer": 0.3749106606821236, + "step": 18880 + }, + { + "epoch": 2.8, + "learning_rate": 8.633531157270031e-06, + "loss": 1.1808, + "step": 18920 + }, + { + "epoch": 2.8, + "eval_loss": 1.1131999492645264, + "eval_runtime": 516.1991, + "eval_samples_per_second": 14.799, + "eval_wer": 0.37811258183481516, + "step": 18920 + }, + { + "epoch": 2.8, + "learning_rate": 8.630563798219586e-06, + "loss": 1.1685, + "step": 18960 + }, + { + "epoch": 2.8, + "eval_loss": 1.11384916305542, + "eval_runtime": 516.3065, + "eval_samples_per_second": 14.795, + "eval_wer": 0.37708339289287857, + "step": 18960 + }, + { + "epoch": 2.81, + "learning_rate": 8.62759643916914e-06, + "loss": 1.2532, + "step": 19000 + }, + { + "epoch": 2.81, + "eval_loss": 1.1217172145843506, + "eval_runtime": 516.7246, + "eval_samples_per_second": 14.784, + "eval_wer": 0.37819834757997656, + "step": 19000 + }, + { + "epoch": 2.81, + "learning_rate": 8.624629080118695e-06, + "loss": 1.1244, + "step": 19040 + }, + { + "epoch": 2.81, + "eval_loss": 1.1175669431686401, + "eval_runtime": 516.1, + "eval_samples_per_second": 14.801, + "eval_wer": 0.3781697589982561, + "step": 19040 + }, + { + "epoch": 2.82, + "learning_rate": 8.62166172106825e-06, + "loss": 1.0988, + "step": 19080 + }, + { + "epoch": 2.82, + "eval_loss": 1.1343427896499634, + "eval_runtime": 515.5864, + "eval_samples_per_second": 14.816, + "eval_wer": 0.378970239286429, + "step": 19080 + }, + { + "epoch": 2.83, + "learning_rate": 8.618694362017805e-06, + "loss": 1.1842, + "step": 19120 + }, + { + "epoch": 2.83, + "eval_loss": 1.1403149366378784, + "eval_runtime": 516.3351, + "eval_samples_per_second": 14.795, + "eval_wer": 0.3794276565939564, + "step": 19120 + }, + { + "epoch": 2.83, + "learning_rate": 8.61572700296736e-06, + "loss": 1.175, + "step": 19160 + }, + { + "epoch": 2.83, + "eval_loss": 1.1043176651000977, + "eval_runtime": 516.7219, + "eval_samples_per_second": 14.784, + "eval_wer": 0.3770548043111581, + "step": 19160 + }, + { + "epoch": 2.84, + "learning_rate": 8.612759643916914e-06, + "loss": 1.1973, + "step": 19200 + }, + { + "epoch": 2.84, + "eval_loss": 1.1285748481750488, + "eval_runtime": 517.6517, + "eval_samples_per_second": 14.757, + "eval_wer": 0.37928471368535405, + "step": 19200 + }, + { + "epoch": 2.84, + "learning_rate": 8.609792284866469e-06, + "loss": 1.1228, + "step": 19240 + }, + { + "epoch": 2.84, + "eval_loss": 1.1576749086380005, + "eval_runtime": 518.0152, + "eval_samples_per_second": 14.747, + "eval_wer": 0.3813716801509477, + "step": 19240 + }, + { + "epoch": 2.85, + "learning_rate": 8.606824925816025e-06, + "loss": 1.1334, + "step": 19280 + }, + { + "epoch": 2.85, + "eval_loss": 1.1222729682922363, + "eval_runtime": 516.019, + "eval_samples_per_second": 14.804, + "eval_wer": 0.3782555247434175, + "step": 19280 + }, + { + "epoch": 2.86, + "learning_rate": 8.60385756676558e-06, + "loss": 1.2958, + "step": 19320 + }, + { + "epoch": 2.86, + "eval_loss": 1.0419676303863525, + "eval_runtime": 517.9879, + "eval_samples_per_second": 14.747, + "eval_wer": 0.3729380485434118, + "step": 19320 + }, + { + "epoch": 2.86, + "learning_rate": 8.600890207715135e-06, + "loss": 1.2158, + "step": 19360 + }, + { + "epoch": 2.86, + "eval_loss": 1.1009387969970703, + "eval_runtime": 521.3626, + "eval_samples_per_second": 14.652, + "eval_wer": 0.37734069012836274, + "step": 19360 + }, + { + "epoch": 2.87, + "learning_rate": 8.59792284866469e-06, + "loss": 1.2198, + "step": 19400 + }, + { + "epoch": 2.87, + "eval_loss": 1.0753209590911865, + "eval_runtime": 515.5569, + "eval_samples_per_second": 14.817, + "eval_wer": 0.375682552388576, + "step": 19400 + }, + { + "epoch": 2.87, + "learning_rate": 8.594955489614244e-06, + "loss": 1.1454, + "step": 19440 + }, + { + "epoch": 2.87, + "eval_loss": 1.091271996498108, + "eval_runtime": 517.0365, + "eval_samples_per_second": 14.775, + "eval_wer": 0.37716915863803996, + "step": 19440 + }, + { + "epoch": 2.88, + "learning_rate": 8.591988130563799e-06, + "loss": 1.1959, + "step": 19480 + }, + { + "epoch": 2.88, + "eval_loss": 1.0927106142044067, + "eval_runtime": 516.347, + "eval_samples_per_second": 14.794, + "eval_wer": 0.3778838731810515, + "step": 19480 + }, + { + "epoch": 2.89, + "learning_rate": 8.589020771513353e-06, + "loss": 1.2008, + "step": 19520 + }, + { + "epoch": 2.89, + "eval_loss": 1.126986026763916, + "eval_runtime": 515.6236, + "eval_samples_per_second": 14.815, + "eval_wer": 0.3799994282283656, + "step": 19520 + }, + { + "epoch": 2.89, + "learning_rate": 8.58605341246291e-06, + "loss": 1.09, + "step": 19560 + }, + { + "epoch": 2.89, + "eval_loss": 1.115182638168335, + "eval_runtime": 518.0902, + "eval_samples_per_second": 14.745, + "eval_wer": 0.37785528459933104, + "step": 19560 + }, + { + "epoch": 2.9, + "learning_rate": 8.583086053412464e-06, + "loss": 1.2073, + "step": 19600 + }, + { + "epoch": 2.9, + "eval_loss": 1.098750352859497, + "eval_runtime": 518.357, + "eval_samples_per_second": 14.737, + "eval_wer": 0.3762829126047057, + "step": 19600 + }, + { + "epoch": 2.9, + "learning_rate": 8.580118694362018e-06, + "loss": 1.1635, + "step": 19640 + }, + { + "epoch": 2.9, + "eval_loss": 1.0704712867736816, + "eval_runtime": 515.3914, + "eval_samples_per_second": 14.822, + "eval_wer": 0.37359558592298237, + "step": 19640 + }, + { + "epoch": 2.91, + "learning_rate": 8.577151335311573e-06, + "loss": 1.1736, + "step": 19680 + }, + { + "epoch": 2.91, + "eval_loss": 1.1426914930343628, + "eval_runtime": 515.819, + "eval_samples_per_second": 14.809, + "eval_wer": 0.3799422510649247, + "step": 19680 + }, + { + "epoch": 2.91, + "learning_rate": 8.574183976261127e-06, + "loss": 1.202, + "step": 19720 + }, + { + "epoch": 2.91, + "eval_loss": 1.1212471723556519, + "eval_runtime": 515.9544, + "eval_samples_per_second": 14.806, + "eval_wer": 0.377483633036965, + "step": 19720 + }, + { + "epoch": 2.92, + "learning_rate": 8.571216617210683e-06, + "loss": 1.2141, + "step": 19760 + }, + { + "epoch": 2.92, + "eval_loss": 1.1012051105499268, + "eval_runtime": 515.5679, + "eval_samples_per_second": 14.817, + "eval_wer": 0.37696903856599673, + "step": 19760 + }, + { + "epoch": 2.93, + "learning_rate": 8.568249258160238e-06, + "loss": 1.1826, + "step": 19800 + }, + { + "epoch": 2.93, + "eval_loss": 1.1140936613082886, + "eval_runtime": 515.8615, + "eval_samples_per_second": 14.808, + "eval_wer": 0.37742645587352414, + "step": 19800 + }, + { + "epoch": 2.93, + "learning_rate": 8.565281899109794e-06, + "loss": 1.1723, + "step": 19840 + }, + { + "epoch": 2.93, + "eval_loss": 1.0519355535507202, + "eval_runtime": 516.735, + "eval_samples_per_second": 14.783, + "eval_wer": 0.3726807513079276, + "step": 19840 + }, + { + "epoch": 2.94, + "learning_rate": 8.562314540059348e-06, + "loss": 1.1668, + "step": 19880 + }, + { + "epoch": 2.94, + "eval_loss": 1.049087405204773, + "eval_runtime": 515.6057, + "eval_samples_per_second": 14.816, + "eval_wer": 0.37273792847136855, + "step": 19880 + }, + { + "epoch": 2.94, + "learning_rate": 8.559347181008903e-06, + "loss": 1.1601, + "step": 19920 + }, + { + "epoch": 2.94, + "eval_loss": 1.0791616439819336, + "eval_runtime": 516.4085, + "eval_samples_per_second": 14.793, + "eval_wer": 0.37402441464878927, + "step": 19920 + }, + { + "epoch": 2.95, + "learning_rate": 8.556379821958459e-06, + "loss": 1.2613, + "step": 19960 + }, + { + "epoch": 2.95, + "eval_loss": 1.1286110877990723, + "eval_runtime": 516.7442, + "eval_samples_per_second": 14.783, + "eval_wer": 0.37716915863803996, + "step": 19960 + }, + { + "epoch": 2.96, + "learning_rate": 8.553412462908013e-06, + "loss": 1.1734, + "step": 20000 + }, + { + "epoch": 2.96, + "eval_loss": 1.1111928224563599, + "eval_runtime": 516.3196, + "eval_samples_per_second": 14.795, + "eval_wer": 0.37596843820578063, + "step": 20000 + }, + { + "epoch": 2.96, + "learning_rate": 8.550445103857568e-06, + "loss": 1.1651, + "step": 20040 + }, + { + "epoch": 2.96, + "eval_loss": 1.2235898971557617, + "eval_runtime": 516.3571, + "eval_samples_per_second": 14.794, + "eval_wer": 0.3869464535864376, + "step": 20040 + }, + { + "epoch": 2.97, + "learning_rate": 8.547477744807122e-06, + "loss": 1.1606, + "step": 20080 + }, + { + "epoch": 2.97, + "eval_loss": 1.0352063179016113, + "eval_runtime": 520.5348, + "eval_samples_per_second": 14.675, + "eval_wer": 0.3706509620057749, + "step": 20080 + }, + { + "epoch": 2.97, + "learning_rate": 8.544510385756677e-06, + "loss": 1.1521, + "step": 20120 + }, + { + "epoch": 2.97, + "eval_loss": 1.0770621299743652, + "eval_runtime": 516.3297, + "eval_samples_per_second": 14.795, + "eval_wer": 0.37373852883158465, + "step": 20120 + }, + { + "epoch": 2.98, + "learning_rate": 8.541543026706233e-06, + "loss": 1.1915, + "step": 20160 + }, + { + "epoch": 2.98, + "eval_loss": 1.0596503019332886, + "eval_runtime": 514.5222, + "eval_samples_per_second": 14.847, + "eval_wer": 0.3719660367649161, + "step": 20160 + }, + { + "epoch": 2.99, + "learning_rate": 8.538575667655787e-06, + "loss": 1.1223, + "step": 20200 + }, + { + "epoch": 2.99, + "eval_loss": 1.1415525674819946, + "eval_runtime": 515.5759, + "eval_samples_per_second": 14.816, + "eval_wer": 0.3789130621229881, + "step": 20200 + }, + { + "epoch": 2.99, + "learning_rate": 8.535608308605342e-06, + "loss": 1.1826, + "step": 20240 + }, + { + "epoch": 2.99, + "eval_loss": 1.0877865552902222, + "eval_runtime": 515.0528, + "eval_samples_per_second": 14.831, + "eval_wer": 0.3740815918122302, + "step": 20240 + }, + { + "epoch": 3.0, + "learning_rate": 8.532640949554896e-06, + "loss": 1.1451, + "step": 20280 + }, + { + "epoch": 3.0, + "eval_loss": 1.0747556686401367, + "eval_runtime": 515.9536, + "eval_samples_per_second": 14.806, + "eval_wer": 0.37322393436061635, + "step": 20280 + }, + { + "epoch": 3.0, + "learning_rate": 8.529673590504452e-06, + "loss": 1.1999, + "step": 20320 + }, + { + "epoch": 3.0, + "eval_loss": 1.0862082242965698, + "eval_runtime": 513.4887, + "eval_samples_per_second": 14.877, + "eval_wer": 0.37536807798965094, + "step": 20320 + }, + { + "epoch": 3.01, + "learning_rate": 8.526706231454007e-06, + "loss": 1.1235, + "step": 20360 + }, + { + "epoch": 3.01, + "eval_loss": 1.128408670425415, + "eval_runtime": 516.217, + "eval_samples_per_second": 14.798, + "eval_wer": 0.37854141056062207, + "step": 20360 + }, + { + "epoch": 3.02, + "learning_rate": 8.523738872403563e-06, + "loss": 1.1597, + "step": 20400 + }, + { + "epoch": 3.02, + "eval_loss": 1.135339617729187, + "eval_runtime": 515.7078, + "eval_samples_per_second": 14.813, + "eval_wer": 0.3796849538294405, + "step": 20400 + }, + { + "epoch": 3.02, + "learning_rate": 8.520771513353117e-06, + "loss": 1.1563, + "step": 20440 + }, + { + "epoch": 3.02, + "eval_loss": 1.0884416103363037, + "eval_runtime": 514.3925, + "eval_samples_per_second": 14.851, + "eval_wer": 0.37433888904771434, + "step": 20440 + }, + { + "epoch": 3.03, + "learning_rate": 8.517804154302672e-06, + "loss": 1.1069, + "step": 20480 + }, + { + "epoch": 3.03, + "eval_loss": 1.157616376876831, + "eval_runtime": 515.0409, + "eval_samples_per_second": 14.832, + "eval_wer": 0.38082849709825894, + "step": 20480 + }, + { + "epoch": 3.03, + "learning_rate": 8.514836795252226e-06, + "loss": 1.0867, + "step": 20520 + }, + { + "epoch": 3.03, + "eval_loss": 1.1581332683563232, + "eval_runtime": 514.5428, + "eval_samples_per_second": 14.846, + "eval_wer": 0.3803710797907316, + "step": 20520 + }, + { + "epoch": 3.04, + "learning_rate": 8.51186943620178e-06, + "loss": 1.1283, + "step": 20560 + }, + { + "epoch": 3.04, + "eval_loss": 1.1061222553253174, + "eval_runtime": 514.8105, + "eval_samples_per_second": 14.838, + "eval_wer": 0.37556819806169417, + "step": 20560 + }, + { + "epoch": 3.05, + "learning_rate": 8.508902077151337e-06, + "loss": 1.1219, + "step": 20600 + }, + { + "epoch": 3.05, + "eval_loss": 1.1390607357025146, + "eval_runtime": 514.8769, + "eval_samples_per_second": 14.837, + "eval_wer": 0.378598587724063, + "step": 20600 + }, + { + "epoch": 3.05, + "learning_rate": 8.505934718100891e-06, + "loss": 1.1943, + "step": 20640 + }, + { + "epoch": 3.05, + "eval_loss": 1.035829782485962, + "eval_runtime": 514.0488, + "eval_samples_per_second": 14.86, + "eval_wer": 0.36965036164555876, + "step": 20640 + }, + { + "epoch": 3.06, + "learning_rate": 8.502967359050445e-06, + "loss": 1.1254, + "step": 20680 + }, + { + "epoch": 3.06, + "eval_loss": 1.0715820789337158, + "eval_runtime": 514.3522, + "eval_samples_per_second": 14.852, + "eval_wer": 0.373509820177821, + "step": 20680 + }, + { + "epoch": 3.06, + "learning_rate": 8.5e-06, + "loss": 1.1414, + "step": 20720 + }, + { + "epoch": 3.06, + "eval_loss": 1.0662944316864014, + "eval_runtime": 516.8478, + "eval_samples_per_second": 14.78, + "eval_wer": 0.3731953457788959, + "step": 20720 + }, + { + "epoch": 3.07, + "learning_rate": 8.497032640949554e-06, + "loss": 1.204, + "step": 20760 + }, + { + "epoch": 3.07, + "eval_loss": 1.0624639987945557, + "eval_runtime": 514.8652, + "eval_samples_per_second": 14.837, + "eval_wer": 0.3725949855627662, + "step": 20760 + }, + { + "epoch": 3.07, + "learning_rate": 8.49406528189911e-06, + "loss": 1.0996, + "step": 20800 + }, + { + "epoch": 3.07, + "eval_loss": 1.083921194076538, + "eval_runtime": 514.091, + "eval_samples_per_second": 14.859, + "eval_wer": 0.37419594613911206, + "step": 20800 + }, + { + "epoch": 3.08, + "learning_rate": 8.491097922848665e-06, + "loss": 1.208, + "step": 20840 + }, + { + "epoch": 3.08, + "eval_loss": 1.0995850563049316, + "eval_runtime": 514.7452, + "eval_samples_per_second": 14.84, + "eval_wer": 0.37648303267674893, + "step": 20840 + }, + { + "epoch": 3.09, + "learning_rate": 8.488130563798221e-06, + "loss": 1.0673, + "step": 20880 + }, + { + "epoch": 3.09, + "eval_loss": 1.1160041093826294, + "eval_runtime": 517.8167, + "eval_samples_per_second": 14.752, + "eval_wer": 0.3782555247434175, + "step": 20880 + }, + { + "epoch": 3.09, + "learning_rate": 8.485163204747776e-06, + "loss": 1.2303, + "step": 20920 + }, + { + "epoch": 3.09, + "eval_loss": 1.0817983150482178, + "eval_runtime": 516.0756, + "eval_samples_per_second": 14.802, + "eval_wer": 0.3751679579176077, + "step": 20920 + }, + { + "epoch": 3.1, + "learning_rate": 8.48219584569733e-06, + "loss": 1.1616, + "step": 20960 + }, + { + "epoch": 3.1, + "eval_loss": 1.1048927307128906, + "eval_runtime": 514.63, + "eval_samples_per_second": 14.844, + "eval_wer": 0.3759112610423397, + "step": 20960 + }, + { + "epoch": 3.1, + "learning_rate": 8.479228486646886e-06, + "loss": 1.1294, + "step": 21000 + }, + { + "epoch": 3.1, + "eval_loss": 1.0734093189239502, + "eval_runtime": 519.4523, + "eval_samples_per_second": 14.706, + "eval_wer": 0.3730238142885731, + "step": 21000 + }, + { + "epoch": 3.11, + "learning_rate": 8.47626112759644e-06, + "loss": 1.1483, + "step": 21040 + }, + { + "epoch": 3.11, + "eval_loss": 1.0604857206344604, + "eval_runtime": 517.0284, + "eval_samples_per_second": 14.775, + "eval_wer": 0.37228051116384114, + "step": 21040 + }, + { + "epoch": 3.12, + "learning_rate": 8.473293768545995e-06, + "loss": 1.1762, + "step": 21080 + }, + { + "epoch": 3.12, + "eval_loss": 1.1276168823242188, + "eval_runtime": 515.896, + "eval_samples_per_second": 14.807, + "eval_wer": 0.3773692787100832, + "step": 21080 + }, + { + "epoch": 3.12, + "learning_rate": 8.47032640949555e-06, + "loss": 1.1141, + "step": 21120 + }, + { + "epoch": 3.12, + "eval_loss": 1.0490329265594482, + "eval_runtime": 514.6539, + "eval_samples_per_second": 14.843, + "eval_wer": 0.36939306441007463, + "step": 21120 + }, + { + "epoch": 3.13, + "learning_rate": 8.467359050445104e-06, + "loss": 1.0878, + "step": 21160 + }, + { + "epoch": 3.13, + "eval_loss": 1.1174302101135254, + "eval_runtime": 516.1648, + "eval_samples_per_second": 14.8, + "eval_wer": 0.375682552388576, + "step": 21160 + }, + { + "epoch": 3.13, + "learning_rate": 8.46439169139466e-06, + "loss": 1.0959, + "step": 21200 + }, + { + "epoch": 3.13, + "eval_loss": 1.0837537050247192, + "eval_runtime": 517.2945, + "eval_samples_per_second": 14.767, + "eval_wer": 0.37325252294233685, + "step": 21200 + }, + { + "epoch": 3.14, + "learning_rate": 8.461424332344214e-06, + "loss": 1.1362, + "step": 21240 + }, + { + "epoch": 3.14, + "eval_loss": 1.0660594701766968, + "eval_runtime": 522.2208, + "eval_samples_per_second": 14.628, + "eval_wer": 0.3712227336401841, + "step": 21240 + }, + { + "epoch": 3.15, + "learning_rate": 8.458456973293769e-06, + "loss": 1.1943, + "step": 21280 + }, + { + "epoch": 3.15, + "eval_loss": 1.0806292295455933, + "eval_runtime": 518.0785, + "eval_samples_per_second": 14.745, + "eval_wer": 0.37222333400040025, + "step": 21280 + }, + { + "epoch": 3.15, + "learning_rate": 8.455489614243323e-06, + "loss": 1.1543, + "step": 21320 + }, + { + "epoch": 3.15, + "eval_loss": 1.0360326766967773, + "eval_runtime": 516.6576, + "eval_samples_per_second": 14.785, + "eval_wer": 0.36910717859287, + "step": 21320 + }, + { + "epoch": 3.16, + "learning_rate": 8.45252225519288e-06, + "loss": 1.0821, + "step": 21360 + }, + { + "epoch": 3.16, + "eval_loss": 1.1198805570602417, + "eval_runtime": 516.5216, + "eval_samples_per_second": 14.789, + "eval_wer": 0.37656879842191027, + "step": 21360 + }, + { + "epoch": 3.16, + "learning_rate": 8.449554896142434e-06, + "loss": 1.1285, + "step": 21400 + }, + { + "epoch": 3.16, + "eval_loss": 1.1015830039978027, + "eval_runtime": 516.9959, + "eval_samples_per_second": 14.776, + "eval_wer": 0.3749678378455645, + "step": 21400 + }, + { + "epoch": 3.17, + "learning_rate": 8.446587537091988e-06, + "loss": 1.1884, + "step": 21440 + }, + { + "epoch": 3.17, + "eval_loss": 1.0140068531036377, + "eval_runtime": 515.519, + "eval_samples_per_second": 14.818, + "eval_wer": 0.36682009205523314, + "step": 21440 + }, + { + "epoch": 3.18, + "learning_rate": 8.443620178041544e-06, + "loss": 1.1497, + "step": 21480 + }, + { + "epoch": 3.18, + "eval_loss": 1.0721839666366577, + "eval_runtime": 518.8796, + "eval_samples_per_second": 14.722, + "eval_wer": 0.37288087137997084, + "step": 21480 + }, + { + "epoch": 3.18, + "learning_rate": 8.440652818991099e-06, + "loss": 1.2484, + "step": 21520 + }, + { + "epoch": 3.18, + "eval_loss": 1.0338966846466064, + "eval_runtime": 519.2134, + "eval_samples_per_second": 14.713, + "eval_wer": 0.36856399554018127, + "step": 21520 + }, + { + "epoch": 3.19, + "learning_rate": 8.437685459940653e-06, + "loss": 1.2737, + "step": 21560 + }, + { + "epoch": 3.19, + "eval_loss": 1.0333644151687622, + "eval_runtime": 517.1258, + "eval_samples_per_second": 14.772, + "eval_wer": 0.3686783498670631, + "step": 21560 + }, + { + "epoch": 3.19, + "learning_rate": 8.434718100890208e-06, + "loss": 1.1637, + "step": 21600 + }, + { + "epoch": 3.19, + "eval_loss": 1.0518370866775513, + "eval_runtime": 517.4701, + "eval_samples_per_second": 14.762, + "eval_wer": 0.37039366477029073, + "step": 21600 + }, + { + "epoch": 3.2, + "learning_rate": 8.431750741839764e-06, + "loss": 1.1531, + "step": 21640 + }, + { + "epoch": 3.2, + "eval_loss": 1.1203532218933105, + "eval_runtime": 521.9575, + "eval_samples_per_second": 14.635, + "eval_wer": 0.3765116212584694, + "step": 21640 + }, + { + "epoch": 3.2, + "learning_rate": 8.428783382789318e-06, + "loss": 1.1296, + "step": 21680 + }, + { + "epoch": 3.2, + "eval_loss": 1.0469988584518433, + "eval_runtime": 515.2315, + "eval_samples_per_second": 14.826, + "eval_wer": 0.36959318448211786, + "step": 21680 + }, + { + "epoch": 3.21, + "learning_rate": 8.425816023738873e-06, + "loss": 1.1254, + "step": 21720 + }, + { + "epoch": 3.21, + "eval_loss": 1.0680608749389648, + "eval_runtime": 514.5791, + "eval_samples_per_second": 14.845, + "eval_wer": 0.3706223734240544, + "step": 21720 + }, + { + "epoch": 3.22, + "learning_rate": 8.422848664688427e-06, + "loss": 1.1541, + "step": 21760 + }, + { + "epoch": 3.22, + "eval_loss": 1.0869226455688477, + "eval_runtime": 515.4377, + "eval_samples_per_second": 14.82, + "eval_wer": 0.3728522827982504, + "step": 21760 + }, + { + "epoch": 3.22, + "learning_rate": 8.419881305637982e-06, + "loss": 1.1613, + "step": 21800 + }, + { + "epoch": 3.22, + "eval_loss": 1.0312713384628296, + "eval_runtime": 514.8343, + "eval_samples_per_second": 14.838, + "eval_wer": 0.3689356471025472, + "step": 21800 + }, + { + "epoch": 3.23, + "learning_rate": 8.416913946587538e-06, + "loss": 1.1442, + "step": 21840 + }, + { + "epoch": 3.23, + "eval_loss": 1.0625436305999756, + "eval_runtime": 515.7724, + "eval_samples_per_second": 14.811, + "eval_wer": 0.37010777895308616, + "step": 21840 + }, + { + "epoch": 3.23, + "learning_rate": 8.413946587537092e-06, + "loss": 1.2311, + "step": 21880 + }, + { + "epoch": 3.23, + "eval_loss": 1.0760008096694946, + "eval_runtime": 515.7087, + "eval_samples_per_second": 14.813, + "eval_wer": 0.3714514422939478, + "step": 21880 + }, + { + "epoch": 3.24, + "learning_rate": 8.410979228486648e-06, + "loss": 1.1762, + "step": 21920 + }, + { + "epoch": 3.24, + "eval_loss": 1.0661391019821167, + "eval_runtime": 516.1088, + "eval_samples_per_second": 14.801, + "eval_wer": 0.3713942651305069, + "step": 21920 + }, + { + "epoch": 3.25, + "learning_rate": 8.408011869436203e-06, + "loss": 1.1926, + "step": 21960 + }, + { + "epoch": 3.25, + "eval_loss": 1.086608648300171, + "eval_runtime": 515.65, + "eval_samples_per_second": 14.814, + "eval_wer": 0.3730238142885731, + "step": 21960 + }, + { + "epoch": 3.25, + "learning_rate": 8.405044510385757e-06, + "loss": 1.1385, + "step": 22000 + }, + { + "epoch": 3.25, + "eval_loss": 1.0777784585952759, + "eval_runtime": 516.8973, + "eval_samples_per_second": 14.779, + "eval_wer": 0.37222333400040025, + "step": 22000 + }, + { + "epoch": 3.26, + "learning_rate": 8.402077151335313e-06, + "loss": 1.1241, + "step": 22040 + }, + { + "epoch": 3.26, + "eval_loss": 1.057078242301941, + "eval_runtime": 515.3241, + "eval_samples_per_second": 14.824, + "eval_wer": 0.37102261356814087, + "step": 22040 + }, + { + "epoch": 3.26, + "learning_rate": 8.399109792284868e-06, + "loss": 1.201, + "step": 22080 + }, + { + "epoch": 3.26, + "eval_loss": 1.049026608467102, + "eval_runtime": 514.7594, + "eval_samples_per_second": 14.84, + "eval_wer": 0.370222133279968, + "step": 22080 + }, + { + "epoch": 3.27, + "learning_rate": 8.396142433234422e-06, + "loss": 1.1901, + "step": 22120 + }, + { + "epoch": 3.27, + "eval_loss": 1.0657296180725098, + "eval_runtime": 516.4573, + "eval_samples_per_second": 14.791, + "eval_wer": 0.3714514422939478, + "step": 22120 + }, + { + "epoch": 3.28, + "learning_rate": 8.393175074183977e-06, + "loss": 1.1255, + "step": 22160 + }, + { + "epoch": 3.28, + "eval_loss": 1.0521280765533447, + "eval_runtime": 518.6377, + "eval_samples_per_second": 14.729, + "eval_wer": 0.36999342462620427, + "step": 22160 + }, + { + "epoch": 3.28, + "learning_rate": 8.390207715133531e-06, + "loss": 1.1628, + "step": 22200 + }, + { + "epoch": 3.28, + "eval_loss": 1.0484883785247803, + "eval_runtime": 515.3997, + "eval_samples_per_second": 14.822, + "eval_wer": 0.3701363675348066, + "step": 22200 + }, + { + "epoch": 3.29, + "learning_rate": 8.387240356083087e-06, + "loss": 1.1132, + "step": 22240 + }, + { + "epoch": 3.29, + "eval_loss": 1.1115612983703613, + "eval_runtime": 516.1493, + "eval_samples_per_second": 14.8, + "eval_wer": 0.3753966665713714, + "step": 22240 + }, + { + "epoch": 3.29, + "learning_rate": 8.384272997032642e-06, + "loss": 1.0926, + "step": 22280 + }, + { + "epoch": 3.29, + "eval_loss": 1.0674867630004883, + "eval_runtime": 519.8586, + "eval_samples_per_second": 14.694, + "eval_wer": 0.3709654364047, + "step": 22280 + }, + { + "epoch": 3.3, + "learning_rate": 8.381305637982196e-06, + "loss": 1.1912, + "step": 22320 + }, + { + "epoch": 3.3, + "eval_loss": 1.118621587753296, + "eval_runtime": 515.8764, + "eval_samples_per_second": 14.808, + "eval_wer": 0.3758540838788988, + "step": 22320 + }, + { + "epoch": 3.31, + "learning_rate": 8.37833827893175e-06, + "loss": 1.2248, + "step": 22360 + }, + { + "epoch": 3.31, + "eval_loss": 1.0436322689056396, + "eval_runtime": 515.9987, + "eval_samples_per_second": 14.804, + "eval_wer": 0.3697075388089997, + "step": 22360 + }, + { + "epoch": 3.31, + "learning_rate": 8.375370919881307e-06, + "loss": 1.082, + "step": 22400 + }, + { + "epoch": 3.31, + "eval_loss": 1.1002633571624756, + "eval_runtime": 516.5189, + "eval_samples_per_second": 14.789, + "eval_wer": 0.3738528831584665, + "step": 22400 + }, + { + "epoch": 3.32, + "learning_rate": 8.372403560830861e-06, + "loss": 1.1479, + "step": 22440 + }, + { + "epoch": 3.32, + "eval_loss": 1.069524884223938, + "eval_runtime": 518.569, + "eval_samples_per_second": 14.731, + "eval_wer": 0.37067955058749535, + "step": 22440 + }, + { + "epoch": 3.32, + "learning_rate": 8.369436201780416e-06, + "loss": 1.13, + "step": 22480 + }, + { + "epoch": 3.32, + "eval_loss": 1.0654046535491943, + "eval_runtime": 517.2424, + "eval_samples_per_second": 14.769, + "eval_wer": 0.37059378484233396, + "step": 22480 + }, + { + "epoch": 3.33, + "learning_rate": 8.366468842729972e-06, + "loss": 1.1767, + "step": 22520 + }, + { + "epoch": 3.33, + "eval_loss": 1.0833700895309448, + "eval_runtime": 518.2564, + "eval_samples_per_second": 14.74, + "eval_wer": 0.3719660367649161, + "step": 22520 + }, + { + "epoch": 3.33, + "learning_rate": 8.363501483679526e-06, + "loss": 1.1744, + "step": 22560 + }, + { + "epoch": 3.33, + "eval_loss": 1.0505093336105347, + "eval_runtime": 517.9745, + "eval_samples_per_second": 14.748, + "eval_wer": 0.36982189313588154, + "step": 22560 + }, + { + "epoch": 3.34, + "learning_rate": 8.36053412462908e-06, + "loss": 1.083, + "step": 22600 + }, + { + "epoch": 3.34, + "eval_loss": 1.1251804828643799, + "eval_runtime": 516.7801, + "eval_samples_per_second": 14.782, + "eval_wer": 0.37462477486491896, + "step": 22600 + }, + { + "epoch": 3.35, + "learning_rate": 8.357566765578635e-06, + "loss": 1.1415, + "step": 22640 + }, + { + "epoch": 3.35, + "eval_loss": 1.0841988325119019, + "eval_runtime": 517.5365, + "eval_samples_per_second": 14.76, + "eval_wer": 0.37082249349609764, + "step": 22640 + }, + { + "epoch": 3.35, + "learning_rate": 8.354599406528191e-06, + "loss": 1.1524, + "step": 22680 + }, + { + "epoch": 3.35, + "eval_loss": 1.0576471090316772, + "eval_runtime": 518.7579, + "eval_samples_per_second": 14.726, + "eval_wer": 0.36907859001114957, + "step": 22680 + }, + { + "epoch": 3.36, + "learning_rate": 8.351632047477746e-06, + "loss": 1.1323, + "step": 22720 + }, + { + "epoch": 3.36, + "eval_loss": 1.0637476444244385, + "eval_runtime": 516.7292, + "eval_samples_per_second": 14.783, + "eval_wer": 0.3692501215014723, + "step": 22720 + }, + { + "epoch": 3.36, + "learning_rate": 8.3486646884273e-06, + "loss": 1.2781, + "step": 22760 + }, + { + "epoch": 3.36, + "eval_loss": 1.008151888847351, + "eval_runtime": 519.0821, + "eval_samples_per_second": 14.716, + "eval_wer": 0.36716315503587865, + "step": 22760 + }, + { + "epoch": 3.37, + "learning_rate": 8.345697329376855e-06, + "loss": 1.1216, + "step": 22800 + }, + { + "epoch": 3.37, + "eval_loss": 1.0557352304458618, + "eval_runtime": 516.7109, + "eval_samples_per_second": 14.784, + "eval_wer": 0.36947883015523597, + "step": 22800 + }, + { + "epoch": 3.38, + "learning_rate": 8.342729970326409e-06, + "loss": 1.0908, + "step": 22840 + }, + { + "epoch": 3.38, + "eval_loss": 1.0651558637619019, + "eval_runtime": 521.9658, + "eval_samples_per_second": 14.635, + "eval_wer": 0.37042225335201123, + "step": 22840 + }, + { + "epoch": 3.38, + "learning_rate": 8.339762611275965e-06, + "loss": 1.1704, + "step": 22880 + }, + { + "epoch": 3.38, + "eval_loss": 1.036316990852356, + "eval_runtime": 518.103, + "eval_samples_per_second": 14.744, + "eval_wer": 0.36733468652620144, + "step": 22880 + }, + { + "epoch": 3.39, + "learning_rate": 8.33679525222552e-06, + "loss": 1.1227, + "step": 22920 + }, + { + "epoch": 3.39, + "eval_loss": 1.0647050142288208, + "eval_runtime": 516.7891, + "eval_samples_per_second": 14.782, + "eval_wer": 0.36936447582835413, + "step": 22920 + }, + { + "epoch": 3.39, + "learning_rate": 8.333827893175074e-06, + "loss": 1.2202, + "step": 22960 + }, + { + "epoch": 3.39, + "eval_loss": 1.0371829271316528, + "eval_runtime": 523.8129, + "eval_samples_per_second": 14.583, + "eval_wer": 0.3668772692186741, + "step": 22960 + }, + { + "epoch": 3.4, + "learning_rate": 8.33086053412463e-06, + "loss": 1.1552, + "step": 23000 + }, + { + "epoch": 3.4, + "eval_loss": 1.0524778366088867, + "eval_runtime": 519.4488, + "eval_samples_per_second": 14.706, + "eval_wer": 0.36767774950684695, + "step": 23000 + }, + { + "epoch": 3.41, + "learning_rate": 8.327893175074185e-06, + "loss": 1.1128, + "step": 23040 + }, + { + "epoch": 3.41, + "eval_loss": 1.1172667741775513, + "eval_runtime": 516.835, + "eval_samples_per_second": 14.78, + "eval_wer": 0.37316675719717546, + "step": 23040 + }, + { + "epoch": 3.41, + "learning_rate": 8.32492581602374e-06, + "loss": 1.1093, + "step": 23080 + }, + { + "epoch": 3.41, + "eval_loss": 1.1036713123321533, + "eval_runtime": 517.089, + "eval_samples_per_second": 14.773, + "eval_wer": 0.37170873952943195, + "step": 23080 + }, + { + "epoch": 3.42, + "learning_rate": 8.321958456973295e-06, + "loss": 1.0859, + "step": 23120 + }, + { + "epoch": 3.42, + "eval_loss": 1.1004812717437744, + "eval_runtime": 517.8694, + "eval_samples_per_second": 14.751, + "eval_wer": 0.370222133279968, + "step": 23120 + }, + { + "epoch": 3.42, + "learning_rate": 8.31899109792285e-06, + "loss": 1.2882, + "step": 23160 + }, + { + "epoch": 3.42, + "eval_loss": 1.00663161277771, + "eval_runtime": 517.4839, + "eval_samples_per_second": 14.762, + "eval_wer": 0.3639612338831871, + "step": 23160 + }, + { + "epoch": 3.43, + "learning_rate": 8.316023738872404e-06, + "loss": 1.0962, + "step": 23200 + }, + { + "epoch": 3.43, + "eval_loss": 1.072790503501892, + "eval_runtime": 518.273, + "eval_samples_per_second": 14.739, + "eval_wer": 0.36922153291975185, + "step": 23200 + }, + { + "epoch": 3.44, + "learning_rate": 8.313056379821959e-06, + "loss": 1.1342, + "step": 23240 + }, + { + "epoch": 3.44, + "eval_loss": 1.0271384716033936, + "eval_runtime": 516.6922, + "eval_samples_per_second": 14.784, + "eval_wer": 0.3655050172960919, + "step": 23240 + }, + { + "epoch": 3.44, + "learning_rate": 8.310089020771515e-06, + "loss": 1.1378, + "step": 23280 + }, + { + "epoch": 3.44, + "eval_loss": 1.0719366073608398, + "eval_runtime": 516.6829, + "eval_samples_per_second": 14.785, + "eval_wer": 0.36887846993910633, + "step": 23280 + }, + { + "epoch": 3.45, + "learning_rate": 8.30712166172107e-06, + "loss": 1.1153, + "step": 23320 + }, + { + "epoch": 3.45, + "eval_loss": 1.0656384229660034, + "eval_runtime": 516.8124, + "eval_samples_per_second": 14.781, + "eval_wer": 0.3677921038337288, + "step": 23320 + }, + { + "epoch": 3.45, + "learning_rate": 8.304154302670624e-06, + "loss": 1.1001, + "step": 23360 + }, + { + "epoch": 3.45, + "eval_loss": 1.055397868156433, + "eval_runtime": 519.5407, + "eval_samples_per_second": 14.703, + "eval_wer": 0.36762057234340606, + "step": 23360 + }, + { + "epoch": 3.46, + "learning_rate": 8.301186943620178e-06, + "loss": 1.136, + "step": 23400 + }, + { + "epoch": 3.46, + "eval_loss": 1.0536446571350098, + "eval_runtime": 517.5237, + "eval_samples_per_second": 14.761, + "eval_wer": 0.3672775093627605, + "step": 23400 + }, + { + "epoch": 3.46, + "learning_rate": 8.298219584569732e-06, + "loss": 1.1053, + "step": 23440 + }, + { + "epoch": 3.46, + "eval_loss": 1.0973440408706665, + "eval_runtime": 519.4106, + "eval_samples_per_second": 14.707, + "eval_wer": 0.3721661568369593, + "step": 23440 + }, + { + "epoch": 3.47, + "learning_rate": 8.295252225519289e-06, + "loss": 1.0365, + "step": 23480 + }, + { + "epoch": 3.47, + "eval_loss": 1.1153208017349243, + "eval_runtime": 517.4335, + "eval_samples_per_second": 14.763, + "eval_wer": 0.3738528831584665, + "step": 23480 + }, + { + "epoch": 3.48, + "learning_rate": 8.292284866468843e-06, + "loss": 1.115, + "step": 23520 + }, + { + "epoch": 3.48, + "eval_loss": 1.1201342344284058, + "eval_runtime": 518.773, + "eval_samples_per_second": 14.725, + "eval_wer": 0.3734240544326596, + "step": 23520 + }, + { + "epoch": 3.48, + "learning_rate": 8.2893175074184e-06, + "loss": 1.2185, + "step": 23560 + }, + { + "epoch": 3.48, + "eval_loss": 1.0548752546310425, + "eval_runtime": 517.8173, + "eval_samples_per_second": 14.752, + "eval_wer": 0.36767774950684695, + "step": 23560 + }, + { + "epoch": 3.49, + "learning_rate": 8.286350148367954e-06, + "loss": 1.0682, + "step": 23600 + }, + { + "epoch": 3.49, + "eval_loss": 1.068299412727356, + "eval_runtime": 517.834, + "eval_samples_per_second": 14.752, + "eval_wer": 0.36836387546813804, + "step": 23600 + }, + { + "epoch": 3.49, + "learning_rate": 8.283382789317508e-06, + "loss": 1.0768, + "step": 23640 + }, + { + "epoch": 3.49, + "eval_loss": 1.0500787496566772, + "eval_runtime": 517.6031, + "eval_samples_per_second": 14.758, + "eval_wer": 0.36667714914663085, + "step": 23640 + }, + { + "epoch": 3.5, + "learning_rate": 8.280415430267063e-06, + "loss": 1.1716, + "step": 23680 + }, + { + "epoch": 3.5, + "eval_loss": 1.0508309602737427, + "eval_runtime": 519.4506, + "eval_samples_per_second": 14.706, + "eval_wer": 0.3680208124874925, + "step": 23680 + }, + { + "epoch": 3.51, + "learning_rate": 8.277448071216619e-06, + "loss": 1.0896, + "step": 23720 + }, + { + "epoch": 3.51, + "eval_loss": 1.0668442249298096, + "eval_runtime": 522.7169, + "eval_samples_per_second": 14.614, + "eval_wer": 0.3689356471025472, + "step": 23720 + }, + { + "epoch": 3.51, + "learning_rate": 8.274480712166173e-06, + "loss": 1.1627, + "step": 23760 + }, + { + "epoch": 3.51, + "eval_loss": 1.0905144214630127, + "eval_runtime": 519.23, + "eval_samples_per_second": 14.712, + "eval_wer": 0.3708796706595386, + "step": 23760 + }, + { + "epoch": 3.52, + "learning_rate": 8.271513353115728e-06, + "loss": 1.0731, + "step": 23800 + }, + { + "epoch": 3.52, + "eval_loss": 1.0570732355117798, + "eval_runtime": 518.7712, + "eval_samples_per_second": 14.725, + "eval_wer": 0.3670488007089968, + "step": 23800 + }, + { + "epoch": 3.52, + "learning_rate": 8.268545994065282e-06, + "loss": 1.066, + "step": 23840 + }, + { + "epoch": 3.52, + "eval_loss": 1.103662371635437, + "eval_runtime": 519.1503, + "eval_samples_per_second": 14.714, + "eval_wer": 0.3707081391692158, + "step": 23840 + }, + { + "epoch": 3.53, + "learning_rate": 8.265578635014836e-06, + "loss": 1.0388, + "step": 23880 + }, + { + "epoch": 3.53, + "eval_loss": 1.1405856609344482, + "eval_runtime": 517.7202, + "eval_samples_per_second": 14.755, + "eval_wer": 0.37316675719717546, + "step": 23880 + }, + { + "epoch": 3.54, + "learning_rate": 8.262611275964393e-06, + "loss": 1.1448, + "step": 23920 + }, + { + "epoch": 3.54, + "eval_loss": 1.040247917175293, + "eval_runtime": 517.268, + "eval_samples_per_second": 14.768, + "eval_wer": 0.3650190114068441, + "step": 23920 + }, + { + "epoch": 3.54, + "learning_rate": 8.259643916913947e-06, + "loss": 1.1541, + "step": 23960 + }, + { + "epoch": 3.54, + "eval_loss": 1.1075586080551147, + "eval_runtime": 519.0155, + "eval_samples_per_second": 14.718, + "eval_wer": 0.3707939049143772, + "step": 23960 + }, + { + "epoch": 3.55, + "learning_rate": 8.256676557863501e-06, + "loss": 1.0155, + "step": 24000 + }, + { + "epoch": 3.55, + "eval_loss": 1.1373422145843506, + "eval_runtime": 518.0162, + "eval_samples_per_second": 14.747, + "eval_wer": 0.37368135166814376, + "step": 24000 + }, + { + "epoch": 3.55, + "learning_rate": 8.253709198813058e-06, + "loss": 1.0957, + "step": 24040 + }, + { + "epoch": 3.55, + "eval_loss": 1.105931043624878, + "eval_runtime": 518.0639, + "eval_samples_per_second": 14.745, + "eval_wer": 0.3700506017896452, + "step": 24040 + }, + { + "epoch": 3.56, + "learning_rate": 8.250741839762612e-06, + "loss": 1.1577, + "step": 24080 + }, + { + "epoch": 3.56, + "eval_loss": 1.078569769859314, + "eval_runtime": 517.2465, + "eval_samples_per_second": 14.769, + "eval_wer": 0.36804940106921297, + "step": 24080 + }, + { + "epoch": 3.57, + "learning_rate": 8.247774480712168e-06, + "loss": 1.1332, + "step": 24120 + }, + { + "epoch": 3.57, + "eval_loss": 1.0760174989700317, + "eval_runtime": 520.4801, + "eval_samples_per_second": 14.677, + "eval_wer": 0.36702021212727637, + "step": 24120 + }, + { + "epoch": 3.57, + "learning_rate": 8.244807121661723e-06, + "loss": 1.0911, + "step": 24160 + }, + { + "epoch": 3.57, + "eval_loss": 1.0997047424316406, + "eval_runtime": 517.5382, + "eval_samples_per_second": 14.76, + "eval_wer": 0.36793504674233113, + "step": 24160 + }, + { + "epoch": 3.58, + "learning_rate": 8.241839762611277e-06, + "loss": 1.1245, + "step": 24200 + }, + { + "epoch": 3.58, + "eval_loss": 1.0997531414031982, + "eval_runtime": 515.9246, + "eval_samples_per_second": 14.806, + "eval_wer": 0.3678206924154493, + "step": 24200 + }, + { + "epoch": 3.58, + "learning_rate": 8.238872403560831e-06, + "loss": 1.1391, + "step": 24240 + }, + { + "epoch": 3.58, + "eval_loss": 1.0964620113372803, + "eval_runtime": 520.2211, + "eval_samples_per_second": 14.684, + "eval_wer": 0.36819234397781525, + "step": 24240 + }, + { + "epoch": 3.59, + "learning_rate": 8.235905044510386e-06, + "loss": 1.1152, + "step": 24280 + }, + { + "epoch": 3.59, + "eval_loss": 1.0755976438522339, + "eval_runtime": 516.3352, + "eval_samples_per_second": 14.795, + "eval_wer": 0.3670773892907173, + "step": 24280 + }, + { + "epoch": 3.59, + "learning_rate": 8.232937685459942e-06, + "loss": 1.094, + "step": 24320 + }, + { + "epoch": 3.59, + "eval_loss": 1.0678706169128418, + "eval_runtime": 517.2245, + "eval_samples_per_second": 14.769, + "eval_wer": 0.36599102318533977, + "step": 24320 + }, + { + "epoch": 3.6, + "learning_rate": 8.229970326409497e-06, + "loss": 1.1609, + "step": 24360 + }, + { + "epoch": 3.6, + "eval_loss": 1.0418184995651245, + "eval_runtime": 515.3716, + "eval_samples_per_second": 14.822, + "eval_wer": 0.36358958232082106, + "step": 24360 + }, + { + "epoch": 3.61, + "learning_rate": 8.227002967359051e-06, + "loss": 1.0954, + "step": 24400 + }, + { + "epoch": 3.61, + "eval_loss": 1.0680294036865234, + "eval_runtime": 517.1544, + "eval_samples_per_second": 14.771, + "eval_wer": 0.36587666885845793, + "step": 24400 + }, + { + "epoch": 3.61, + "learning_rate": 8.224035608308605e-06, + "loss": 1.1367, + "step": 24440 + }, + { + "epoch": 3.61, + "eval_loss": 1.0559535026550293, + "eval_runtime": 515.8217, + "eval_samples_per_second": 14.809, + "eval_wer": 0.364390062608994, + "step": 24440 + }, + { + "epoch": 3.62, + "learning_rate": 8.22106824925816e-06, + "loss": 1.0914, + "step": 24480 + }, + { + "epoch": 3.62, + "eval_loss": 1.1288807392120361, + "eval_runtime": 518.94, + "eval_samples_per_second": 14.72, + "eval_wer": 0.37016495611652706, + "step": 24480 + }, + { + "epoch": 3.62, + "learning_rate": 8.218100890207716e-06, + "loss": 1.195, + "step": 24520 + }, + { + "epoch": 3.62, + "eval_loss": 1.1092766523361206, + "eval_runtime": 516.7451, + "eval_samples_per_second": 14.783, + "eval_wer": 0.36884988135738583, + "step": 24520 + }, + { + "epoch": 3.63, + "learning_rate": 8.21513353115727e-06, + "loss": 1.172, + "step": 24560 + }, + { + "epoch": 3.63, + "eval_loss": 1.0519130229949951, + "eval_runtime": 515.9934, + "eval_samples_per_second": 14.804, + "eval_wer": 0.3642185311186712, + "step": 24560 + }, + { + "epoch": 3.64, + "learning_rate": 8.212166172106827e-06, + "loss": 1.0242, + "step": 24600 + }, + { + "epoch": 3.64, + "eval_loss": 1.1354796886444092, + "eval_runtime": 516.7768, + "eval_samples_per_second": 14.782, + "eval_wer": 0.37082249349609764, + "step": 24600 + }, + { + "epoch": 3.64, + "learning_rate": 8.209198813056381e-06, + "loss": 1.1394, + "step": 24640 + }, + { + "epoch": 3.64, + "eval_loss": 1.0994917154312134, + "eval_runtime": 520.2214, + "eval_samples_per_second": 14.684, + "eval_wer": 0.3679064581606106, + "step": 24640 + }, + { + "epoch": 3.65, + "learning_rate": 8.206231454005935e-06, + "loss": 1.16, + "step": 24680 + }, + { + "epoch": 3.65, + "eval_loss": 1.1076852083206177, + "eval_runtime": 516.5948, + "eval_samples_per_second": 14.787, + "eval_wer": 0.3685925841219017, + "step": 24680 + }, + { + "epoch": 3.65, + "learning_rate": 8.20326409495549e-06, + "loss": 1.1059, + "step": 24720 + }, + { + "epoch": 3.65, + "eval_loss": 1.0564041137695312, + "eval_runtime": 515.4181, + "eval_samples_per_second": 14.821, + "eval_wer": 0.3645615940993167, + "step": 24720 + }, + { + "epoch": 3.66, + "learning_rate": 8.200296735905046e-06, + "loss": 1.1476, + "step": 24760 + }, + { + "epoch": 3.66, + "eval_loss": 1.0685328245162964, + "eval_runtime": 518.6712, + "eval_samples_per_second": 14.728, + "eval_wer": 0.3660482003487807, + "step": 24760 + }, + { + "epoch": 3.67, + "learning_rate": 8.1973293768546e-06, + "loss": 1.1303, + "step": 24800 + }, + { + "epoch": 3.67, + "eval_loss": 1.0972750186920166, + "eval_runtime": 515.8094, + "eval_samples_per_second": 14.81, + "eval_wer": 0.3673632751079219, + "step": 24800 + }, + { + "epoch": 3.67, + "learning_rate": 8.194362017804155e-06, + "loss": 1.1167, + "step": 24840 + }, + { + "epoch": 3.67, + "eval_loss": 1.1154098510742188, + "eval_runtime": 515.6336, + "eval_samples_per_second": 14.815, + "eval_wer": 0.36950741873695647, + "step": 24840 + }, + { + "epoch": 3.68, + "learning_rate": 8.19139465875371e-06, + "loss": 1.1049, + "step": 24880 + }, + { + "epoch": 3.68, + "eval_loss": 1.106859564781189, + "eval_runtime": 516.1191, + "eval_samples_per_second": 14.801, + "eval_wer": 0.36982189313588154, + "step": 24880 + }, + { + "epoch": 3.68, + "learning_rate": 8.188427299703264e-06, + "loss": 1.1067, + "step": 24920 + }, + { + "epoch": 3.68, + "eval_loss": 1.0598785877227783, + "eval_runtime": 515.125, + "eval_samples_per_second": 14.829, + "eval_wer": 0.36504759998856456, + "step": 24920 + }, + { + "epoch": 3.69, + "learning_rate": 8.18545994065282e-06, + "loss": 1.1173, + "step": 24960 + }, + { + "epoch": 3.69, + "eval_loss": 1.0663487911224365, + "eval_runtime": 515.8422, + "eval_samples_per_second": 14.809, + "eval_wer": 0.3652477200606078, + "step": 24960 + }, + { + "epoch": 3.7, + "learning_rate": 8.182492581602374e-06, + "loss": 1.0819, + "step": 25000 + }, + { + "epoch": 3.7, + "eval_loss": 1.138964056968689, + "eval_runtime": 517.6711, + "eval_samples_per_second": 14.756, + "eval_wer": 0.37185168243803424, + "step": 25000 + }, + { + "epoch": 3.7, + "learning_rate": 8.179525222551929e-06, + "loss": 1.1119, + "step": 25040 + }, + { + "epoch": 3.7, + "eval_loss": 1.0933104753494263, + "eval_runtime": 515.7148, + "eval_samples_per_second": 14.812, + "eval_wer": 0.36767774950684695, + "step": 25040 + }, + { + "epoch": 3.71, + "learning_rate": 8.176557863501485e-06, + "loss": 1.177, + "step": 25080 + }, + { + "epoch": 3.71, + "eval_loss": 1.0523161888122559, + "eval_runtime": 515.8194, + "eval_samples_per_second": 14.809, + "eval_wer": 0.3640755882100689, + "step": 25080 + }, + { + "epoch": 3.71, + "learning_rate": 8.17359050445104e-06, + "loss": 1.2028, + "step": 25120 + }, + { + "epoch": 3.71, + "eval_loss": 1.0355265140533447, + "eval_runtime": 517.6105, + "eval_samples_per_second": 14.758, + "eval_wer": 0.3639040567197461, + "step": 25120 + }, + { + "epoch": 3.72, + "learning_rate": 8.170623145400594e-06, + "loss": 1.1015, + "step": 25160 + }, + { + "epoch": 3.72, + "eval_loss": 1.0511356592178345, + "eval_runtime": 516.9536, + "eval_samples_per_second": 14.777, + "eval_wer": 0.3656193716229738, + "step": 25160 + }, + { + "epoch": 3.72, + "learning_rate": 8.16765578635015e-06, + "loss": 1.1465, + "step": 25200 + }, + { + "epoch": 3.72, + "eval_loss": 1.0351282358169556, + "eval_runtime": 516.6468, + "eval_samples_per_second": 14.786, + "eval_wer": 0.3644186511907144, + "step": 25200 + }, + { + "epoch": 3.73, + "learning_rate": 8.164688427299704e-06, + "loss": 1.1222, + "step": 25240 + }, + { + "epoch": 3.73, + "eval_loss": 1.0622466802597046, + "eval_runtime": 518.7119, + "eval_samples_per_second": 14.727, + "eval_wer": 0.36504759998856456, + "step": 25240 + }, + { + "epoch": 3.74, + "learning_rate": 8.161721068249259e-06, + "loss": 1.2099, + "step": 25280 + }, + { + "epoch": 3.74, + "eval_loss": 1.0469032526016235, + "eval_runtime": 518.1251, + "eval_samples_per_second": 14.744, + "eval_wer": 0.3653906629692101, + "step": 25280 + }, + { + "epoch": 3.74, + "learning_rate": 8.158753709198813e-06, + "loss": 1.1178, + "step": 25320 + }, + { + "epoch": 3.74, + "eval_loss": 1.1052197217941284, + "eval_runtime": 517.3051, + "eval_samples_per_second": 14.767, + "eval_wer": 0.36973612739072015, + "step": 25320 + }, + { + "epoch": 3.75, + "learning_rate": 8.15578635014837e-06, + "loss": 1.0591, + "step": 25360 + }, + { + "epoch": 3.75, + "eval_loss": 1.0602738857269287, + "eval_runtime": 521.1006, + "eval_samples_per_second": 14.659, + "eval_wer": 0.3660482003487807, + "step": 25360 + }, + { + "epoch": 3.75, + "learning_rate": 8.152818991097924e-06, + "loss": 1.1197, + "step": 25400 + }, + { + "epoch": 3.75, + "eval_loss": 1.06788969039917, + "eval_runtime": 518.0218, + "eval_samples_per_second": 14.746, + "eval_wer": 0.3669630349638354, + "step": 25400 + }, + { + "epoch": 3.76, + "learning_rate": 8.149851632047478e-06, + "loss": 1.1959, + "step": 25440 + }, + { + "epoch": 3.76, + "eval_loss": 1.0256024599075317, + "eval_runtime": 517.3151, + "eval_samples_per_second": 14.767, + "eval_wer": 0.36381829097458473, + "step": 25440 + }, + { + "epoch": 3.77, + "learning_rate": 8.146884272997033e-06, + "loss": 1.1873, + "step": 25480 + }, + { + "epoch": 3.77, + "eval_loss": 1.0199776887893677, + "eval_runtime": 518.2312, + "eval_samples_per_second": 14.741, + "eval_wer": 0.36330369650361644, + "step": 25480 + }, + { + "epoch": 3.77, + "learning_rate": 8.143916913946587e-06, + "loss": 1.0616, + "step": 25520 + }, + { + "epoch": 3.77, + "eval_loss": 1.0315873622894287, + "eval_runtime": 518.463, + "eval_samples_per_second": 14.734, + "eval_wer": 0.36250321621544357, + "step": 25520 + }, + { + "epoch": 3.78, + "learning_rate": 8.140949554896143e-06, + "loss": 1.1199, + "step": 25560 + }, + { + "epoch": 3.78, + "eval_loss": 0.9859173893928528, + "eval_runtime": 518.8125, + "eval_samples_per_second": 14.724, + "eval_wer": 0.3588152891735041, + "step": 25560 + }, + { + "epoch": 3.78, + "learning_rate": 8.137982195845698e-06, + "loss": 1.1564, + "step": 25600 + }, + { + "epoch": 3.78, + "eval_loss": 1.0701929330825806, + "eval_runtime": 515.7523, + "eval_samples_per_second": 14.811, + "eval_wer": 0.3656765487864147, + "step": 25600 + }, + { + "epoch": 3.79, + "learning_rate": 8.135014836795254e-06, + "loss": 1.1339, + "step": 25640 + }, + { + "epoch": 3.79, + "eval_loss": 1.0335668325424194, + "eval_runtime": 515.7591, + "eval_samples_per_second": 14.811, + "eval_wer": 0.3619028559993139, + "step": 25640 + }, + { + "epoch": 3.8, + "learning_rate": 8.132047477744808e-06, + "loss": 1.1867, + "step": 25680 + }, + { + "epoch": 3.8, + "eval_loss": 1.0504717826843262, + "eval_runtime": 515.9514, + "eval_samples_per_second": 14.806, + "eval_wer": 0.36316075359501415, + "step": 25680 + }, + { + "epoch": 3.8, + "learning_rate": 8.129080118694363e-06, + "loss": 1.1478, + "step": 25720 + }, + { + "epoch": 3.8, + "eval_loss": 1.0441105365753174, + "eval_runtime": 515.5364, + "eval_samples_per_second": 14.818, + "eval_wer": 0.3629320449412505, + "step": 25720 + }, + { + "epoch": 3.81, + "learning_rate": 8.126112759643917e-06, + "loss": 1.093, + "step": 25760 + }, + { + "epoch": 3.81, + "eval_loss": 1.0589814186096191, + "eval_runtime": 520.1955, + "eval_samples_per_second": 14.685, + "eval_wer": 0.3634752279939392, + "step": 25760 + }, + { + "epoch": 3.81, + "learning_rate": 8.123145400593473e-06, + "loss": 1.1165, + "step": 25800 + }, + { + "epoch": 3.81, + "eval_loss": 1.0844630002975464, + "eval_runtime": 517.0896, + "eval_samples_per_second": 14.773, + "eval_wer": 0.36616255467566255, + "step": 25800 + }, + { + "epoch": 3.82, + "learning_rate": 8.120178041543028e-06, + "loss": 1.1626, + "step": 25840 + }, + { + "epoch": 3.82, + "eval_loss": 1.0531216859817505, + "eval_runtime": 515.9262, + "eval_samples_per_second": 14.806, + "eval_wer": 0.36301781068641187, + "step": 25840 + }, + { + "epoch": 3.83, + "learning_rate": 8.117210682492582e-06, + "loss": 1.0662, + "step": 25880 + }, + { + "epoch": 3.83, + "eval_loss": 1.0907328128814697, + "eval_runtime": 515.6628, + "eval_samples_per_second": 14.814, + "eval_wer": 0.36613396609394205, + "step": 25880 + }, + { + "epoch": 3.83, + "learning_rate": 8.114243323442137e-06, + "loss": 1.1121, + "step": 25920 + }, + { + "epoch": 3.83, + "eval_loss": 1.0909258127212524, + "eval_runtime": 515.7883, + "eval_samples_per_second": 14.81, + "eval_wer": 0.36573372594985565, + "step": 25920 + }, + { + "epoch": 3.84, + "learning_rate": 8.111275964391691e-06, + "loss": 1.098, + "step": 25960 + }, + { + "epoch": 3.84, + "eval_loss": 1.0629509687423706, + "eval_runtime": 516.5212, + "eval_samples_per_second": 14.789, + "eval_wer": 0.36333228508533694, + "step": 25960 + }, + { + "epoch": 3.84, + "learning_rate": 8.108308605341247e-06, + "loss": 1.2379, + "step": 26000 + }, + { + "epoch": 3.84, + "eval_loss": 1.0843515396118164, + "eval_runtime": 518.1159, + "eval_samples_per_second": 14.744, + "eval_wer": 0.36479030275308044, + "step": 26000 + }, + { + "epoch": 3.85, + "learning_rate": 8.105341246290802e-06, + "loss": 1.1516, + "step": 26040 + }, + { + "epoch": 3.85, + "eval_loss": 1.1244564056396484, + "eval_runtime": 516.0322, + "eval_samples_per_second": 14.803, + "eval_wer": 0.36999342462620427, + "step": 26040 + }, + { + "epoch": 3.86, + "learning_rate": 8.102373887240356e-06, + "loss": 1.177, + "step": 26080 + }, + { + "epoch": 3.86, + "eval_loss": 1.0700942277908325, + "eval_runtime": 516.3542, + "eval_samples_per_second": 14.794, + "eval_wer": 0.3651619543154464, + "step": 26080 + }, + { + "epoch": 3.86, + "learning_rate": 8.099406528189912e-06, + "loss": 1.1204, + "step": 26120 + }, + { + "epoch": 3.86, + "eval_loss": 1.0095574855804443, + "eval_runtime": 516.59, + "eval_samples_per_second": 14.787, + "eval_wer": 0.3605591926584522, + "step": 26120 + }, + { + "epoch": 3.87, + "learning_rate": 8.096439169139467e-06, + "loss": 1.1602, + "step": 26160 + }, + { + "epoch": 3.87, + "eval_loss": 1.064212441444397, + "eval_runtime": 520.8222, + "eval_samples_per_second": 14.667, + "eval_wer": 0.3659624346036193, + "step": 26160 + }, + { + "epoch": 3.87, + "learning_rate": 8.093471810089021e-06, + "loss": 1.1287, + "step": 26200 + }, + { + "epoch": 3.87, + "eval_loss": 1.0908650159835815, + "eval_runtime": 518.0714, + "eval_samples_per_second": 14.745, + "eval_wer": 0.3680208124874925, + "step": 26200 + }, + { + "epoch": 3.88, + "learning_rate": 8.090504451038577e-06, + "loss": 1.1323, + "step": 26240 + }, + { + "epoch": 3.88, + "eval_loss": 1.0467941761016846, + "eval_runtime": 516.9694, + "eval_samples_per_second": 14.777, + "eval_wer": 0.36453300551759626, + "step": 26240 + }, + { + "epoch": 3.88, + "learning_rate": 8.087537091988132e-06, + "loss": 1.1587, + "step": 26280 + }, + { + "epoch": 3.88, + "eval_loss": 1.0467596054077148, + "eval_runtime": 521.8601, + "eval_samples_per_second": 14.638, + "eval_wer": 0.3640469996283484, + "step": 26280 + }, + { + "epoch": 3.89, + "learning_rate": 8.084569732937686e-06, + "loss": 1.1589, + "step": 26320 + }, + { + "epoch": 3.89, + "eval_loss": 1.0611344575881958, + "eval_runtime": 517.6593, + "eval_samples_per_second": 14.757, + "eval_wer": 0.3658480802767375, + "step": 26320 + }, + { + "epoch": 3.9, + "learning_rate": 8.08160237388724e-06, + "loss": 1.1345, + "step": 26360 + }, + { + "epoch": 3.9, + "eval_loss": 1.052765965461731, + "eval_runtime": 515.9981, + "eval_samples_per_second": 14.804, + "eval_wer": 0.3649904228251237, + "step": 26360 + }, + { + "epoch": 3.9, + "learning_rate": 8.078635014836797e-06, + "loss": 1.1395, + "step": 26400 + }, + { + "epoch": 3.9, + "eval_loss": 0.9894335865974426, + "eval_runtime": 518.2458, + "eval_samples_per_second": 14.74, + "eval_wer": 0.35955859229823606, + "step": 26400 + }, + { + "epoch": 3.91, + "learning_rate": 8.075667655786351e-06, + "loss": 1.1246, + "step": 26440 + }, + { + "epoch": 3.91, + "eval_loss": 1.0771129131317139, + "eval_runtime": 517.2215, + "eval_samples_per_second": 14.769, + "eval_wer": 0.3663340861659853, + "step": 26440 + }, + { + "epoch": 3.91, + "learning_rate": 8.072700296735906e-06, + "loss": 1.0896, + "step": 26480 + }, + { + "epoch": 3.91, + "eval_loss": 1.0381693840026855, + "eval_runtime": 517.7439, + "eval_samples_per_second": 14.754, + "eval_wer": 0.36290345635953003, + "step": 26480 + }, + { + "epoch": 3.92, + "learning_rate": 8.06973293768546e-06, + "loss": 1.135, + "step": 26520 + }, + { + "epoch": 3.92, + "eval_loss": 1.0223528146743774, + "eval_runtime": 517.1343, + "eval_samples_per_second": 14.772, + "eval_wer": 0.36153120443694786, + "step": 26520 + }, + { + "epoch": 3.93, + "learning_rate": 8.066765578635015e-06, + "loss": 1.1318, + "step": 26560 + }, + { + "epoch": 3.93, + "eval_loss": 1.0759764909744263, + "eval_runtime": 518.1296, + "eval_samples_per_second": 14.743, + "eval_wer": 0.3655336058778124, + "step": 26560 + }, + { + "epoch": 3.93, + "learning_rate": 8.06379821958457e-06, + "loss": 1.1323, + "step": 26600 + }, + { + "epoch": 3.93, + "eval_loss": 1.0366358757019043, + "eval_runtime": 516.8923, + "eval_samples_per_second": 14.779, + "eval_wer": 0.36264615912404585, + "step": 26600 + }, + { + "epoch": 3.94, + "learning_rate": 8.060830860534125e-06, + "loss": 1.1466, + "step": 26640 + }, + { + "epoch": 3.94, + "eval_loss": 1.0218775272369385, + "eval_runtime": 516.4815, + "eval_samples_per_second": 14.79, + "eval_wer": 0.36221733039823895, + "step": 26640 + }, + { + "epoch": 3.94, + "learning_rate": 8.05786350148368e-06, + "loss": 1.1426, + "step": 26680 + }, + { + "epoch": 3.94, + "eval_loss": 1.0162721872329712, + "eval_runtime": 518.4885, + "eval_samples_per_second": 14.733, + "eval_wer": 0.36256039337888446, + "step": 26680 + }, + { + "epoch": 3.95, + "learning_rate": 8.054896142433236e-06, + "loss": 1.1036, + "step": 26720 + }, + { + "epoch": 3.95, + "eval_loss": 1.0971293449401855, + "eval_runtime": 517.183, + "eval_samples_per_second": 14.77, + "eval_wer": 0.36947883015523597, + "step": 26720 + }, + { + "epoch": 3.96, + "learning_rate": 8.05192878338279e-06, + "loss": 1.1136, + "step": 26760 + }, + { + "epoch": 3.96, + "eval_loss": 1.0138506889343262, + "eval_runtime": 516.7655, + "eval_samples_per_second": 14.782, + "eval_wer": 0.36110237571114095, + "step": 26760 + }, + { + "epoch": 3.96, + "learning_rate": 8.048961424332345e-06, + "loss": 1.1409, + "step": 26800 + }, + { + "epoch": 3.96, + "eval_loss": 1.062695026397705, + "eval_runtime": 515.9413, + "eval_samples_per_second": 14.806, + "eval_wer": 0.36504759998856456, + "step": 26800 + }, + { + "epoch": 3.97, + "learning_rate": 8.0459940652819e-06, + "loss": 1.1389, + "step": 26840 + }, + { + "epoch": 3.97, + "eval_loss": 1.0245001316070557, + "eval_runtime": 519.5194, + "eval_samples_per_second": 14.704, + "eval_wer": 0.36187426741759343, + "step": 26840 + }, + { + "epoch": 3.97, + "learning_rate": 8.043026706231455e-06, + "loss": 1.0802, + "step": 26880 + }, + { + "epoch": 3.97, + "eval_loss": 1.061140537261963, + "eval_runtime": 519.9835, + "eval_samples_per_second": 14.691, + "eval_wer": 0.3649904228251237, + "step": 26880 + }, + { + "epoch": 3.98, + "learning_rate": 8.04005934718101e-06, + "loss": 1.1457, + "step": 26920 + }, + { + "epoch": 3.98, + "eval_loss": 1.0712372064590454, + "eval_runtime": 516.9187, + "eval_samples_per_second": 14.778, + "eval_wer": 0.36639126332942623, + "step": 26920 + }, + { + "epoch": 3.99, + "learning_rate": 8.037091988130564e-06, + "loss": 1.0985, + "step": 26960 + }, + { + "epoch": 3.99, + "eval_loss": 1.0930147171020508, + "eval_runtime": 518.5479, + "eval_samples_per_second": 14.732, + "eval_wer": 0.3694502415735155, + "step": 26960 + }, + { + "epoch": 3.99, + "learning_rate": 8.034124629080118e-06, + "loss": 1.1048, + "step": 27000 + }, + { + "epoch": 3.99, + "eval_loss": 1.0739365816116333, + "eval_runtime": 517.5618, + "eval_samples_per_second": 14.76, + "eval_wer": 0.36682009205523314, + "step": 27000 + }, + { + "epoch": 4.0, + "learning_rate": 8.031157270029675e-06, + "loss": 1.1309, + "step": 27040 + }, + { + "epoch": 4.0, + "eval_loss": 0.9978883266448975, + "eval_runtime": 517.0385, + "eval_samples_per_second": 14.775, + "eval_wer": 0.36058778124017266, + "step": 27040 + }, + { + "epoch": 4.0, + "learning_rate": 8.028189910979229e-06, + "loss": 1.1336, + "step": 27080 + }, + { + "epoch": 4.0, + "eval_loss": 1.087448000907898, + "eval_runtime": 515.0292, + "eval_samples_per_second": 14.832, + "eval_wer": 0.3689070585208268, + "step": 27080 + }, + { + "epoch": 4.01, + "learning_rate": 8.025222551928783e-06, + "loss": 1.1451, + "step": 27120 + }, + { + "epoch": 4.01, + "eval_loss": 1.0311850309371948, + "eval_runtime": 514.574, + "eval_samples_per_second": 14.845, + "eval_wer": 0.3634180508304983, + "step": 27120 + }, + { + "epoch": 4.01, + "learning_rate": 8.022255192878338e-06, + "loss": 1.0441, + "step": 27160 + }, + { + "epoch": 4.01, + "eval_loss": 1.0641337633132935, + "eval_runtime": 516.4295, + "eval_samples_per_second": 14.792, + "eval_wer": 0.3659624346036193, + "step": 27160 + }, + { + "epoch": 4.02, + "learning_rate": 8.019287833827894e-06, + "loss": 1.1014, + "step": 27200 + }, + { + "epoch": 4.02, + "eval_loss": 1.084144949913025, + "eval_runtime": 514.9546, + "eval_samples_per_second": 14.834, + "eval_wer": 0.3676491609251265, + "step": 27200 + }, + { + "epoch": 4.03, + "learning_rate": 8.016320474777449e-06, + "loss": 1.1234, + "step": 27240 + }, + { + "epoch": 4.03, + "eval_loss": 1.0059243440628052, + "eval_runtime": 515.1532, + "eval_samples_per_second": 14.829, + "eval_wer": 0.3608736670573773, + "step": 27240 + }, + { + "epoch": 4.03, + "learning_rate": 8.013353115727005e-06, + "loss": 1.0651, + "step": 27280 + }, + { + "epoch": 4.03, + "eval_loss": 1.0333300828933716, + "eval_runtime": 516.0927, + "eval_samples_per_second": 14.802, + "eval_wer": 0.36290345635953003, + "step": 27280 + }, + { + "epoch": 4.04, + "learning_rate": 8.010385756676559e-06, + "loss": 1.044, + "step": 27320 + }, + { + "epoch": 4.04, + "eval_loss": 1.0695381164550781, + "eval_runtime": 521.8594, + "eval_samples_per_second": 14.638, + "eval_wer": 0.36527630864232824, + "step": 27320 + }, + { + "epoch": 4.04, + "learning_rate": 8.007418397626114e-06, + "loss": 1.1104, + "step": 27360 + }, + { + "epoch": 4.04, + "eval_loss": 1.029439091682434, + "eval_runtime": 516.081, + "eval_samples_per_second": 14.802, + "eval_wer": 0.36161697018210925, + "step": 27360 + }, + { + "epoch": 4.05, + "learning_rate": 8.004451038575668e-06, + "loss": 1.0236, + "step": 27400 + }, + { + "epoch": 4.05, + "eval_loss": 1.053420066833496, + "eval_runtime": 516.6495, + "eval_samples_per_second": 14.786, + "eval_wer": 0.363275107921896, + "step": 27400 + }, + { + "epoch": 4.06, + "learning_rate": 8.001483679525224e-06, + "loss": 1.2236, + "step": 27440 + }, + { + "epoch": 4.06, + "eval_loss": 1.102577567100525, + "eval_runtime": 520.996, + "eval_samples_per_second": 14.662, + "eval_wer": 0.36836387546813804, + "step": 27440 + }, + { + "epoch": 4.06, + "learning_rate": 7.998516320474779e-06, + "loss": 1.0476, + "step": 27480 + }, + { + "epoch": 4.06, + "eval_loss": 1.0757291316986084, + "eval_runtime": 517.8557, + "eval_samples_per_second": 14.751, + "eval_wer": 0.3649904228251237, + "step": 27480 + }, + { + "epoch": 4.07, + "learning_rate": 7.995548961424333e-06, + "loss": 1.0854, + "step": 27520 + }, + { + "epoch": 4.07, + "eval_loss": 1.046846866607666, + "eval_runtime": 517.9208, + "eval_samples_per_second": 14.749, + "eval_wer": 0.3630463992681323, + "step": 27520 + }, + { + "epoch": 4.07, + "learning_rate": 7.992581602373887e-06, + "loss": 1.0753, + "step": 27560 + }, + { + "epoch": 4.07, + "eval_loss": 1.0045180320739746, + "eval_runtime": 521.5964, + "eval_samples_per_second": 14.645, + "eval_wer": 0.35870093484662224, + "step": 27560 + }, + { + "epoch": 4.08, + "learning_rate": 7.989614243323442e-06, + "loss": 1.0949, + "step": 27600 + }, + { + "epoch": 4.08, + "eval_loss": 1.009703278541565, + "eval_runtime": 515.3541, + "eval_samples_per_second": 14.823, + "eval_wer": 0.35981588953372023, + "step": 27600 + }, + { + "epoch": 4.09, + "learning_rate": 7.986646884272998e-06, + "loss": 1.0591, + "step": 27640 + }, + { + "epoch": 4.09, + "eval_loss": 1.0759499073028564, + "eval_runtime": 516.4471, + "eval_samples_per_second": 14.791, + "eval_wer": 0.3659624346036193, + "step": 27640 + }, + { + "epoch": 4.09, + "learning_rate": 7.983679525222552e-06, + "loss": 1.1114, + "step": 27680 + }, + { + "epoch": 4.09, + "eval_loss": 1.0098916292190552, + "eval_runtime": 515.313, + "eval_samples_per_second": 14.824, + "eval_wer": 0.3604734269132908, + "step": 27680 + }, + { + "epoch": 4.1, + "learning_rate": 7.980712166172107e-06, + "loss": 1.0849, + "step": 27720 + }, + { + "epoch": 4.1, + "eval_loss": 1.0640796422958374, + "eval_runtime": 516.6056, + "eval_samples_per_second": 14.787, + "eval_wer": 0.3646473598444781, + "step": 27720 + }, + { + "epoch": 4.1, + "learning_rate": 7.977744807121663e-06, + "loss": 1.0732, + "step": 27760 + }, + { + "epoch": 4.1, + "eval_loss": 1.0664726495742798, + "eval_runtime": 516.7284, + "eval_samples_per_second": 14.783, + "eval_wer": 0.3655336058778124, + "step": 27760 + }, + { + "epoch": 4.11, + "learning_rate": 7.974777448071217e-06, + "loss": 1.0774, + "step": 27800 + }, + { + "epoch": 4.11, + "eval_loss": 1.0448260307312012, + "eval_runtime": 515.9589, + "eval_samples_per_second": 14.805, + "eval_wer": 0.36256039337888446, + "step": 27800 + }, + { + "epoch": 4.12, + "learning_rate": 7.971810089020772e-06, + "loss": 1.1573, + "step": 27840 + }, + { + "epoch": 4.12, + "eval_loss": 0.997246503829956, + "eval_runtime": 515.1986, + "eval_samples_per_second": 14.827, + "eval_wer": 0.3579862203036107, + "step": 27840 + }, + { + "epoch": 4.12, + "learning_rate": 7.968842729970328e-06, + "loss": 1.1299, + "step": 27880 + }, + { + "epoch": 4.12, + "eval_loss": 1.0444852113723755, + "eval_runtime": 515.3873, + "eval_samples_per_second": 14.822, + "eval_wer": 0.3631035764315732, + "step": 27880 + }, + { + "epoch": 4.13, + "learning_rate": 7.965875370919882e-06, + "loss": 1.0772, + "step": 27920 + }, + { + "epoch": 4.13, + "eval_loss": 0.9923107624053955, + "eval_runtime": 515.3931, + "eval_samples_per_second": 14.822, + "eval_wer": 0.35744303725092197, + "step": 27920 + }, + { + "epoch": 4.13, + "learning_rate": 7.962908011869437e-06, + "loss": 1.1101, + "step": 27960 + }, + { + "epoch": 4.13, + "eval_loss": 1.026638388633728, + "eval_runtime": 517.6394, + "eval_samples_per_second": 14.757, + "eval_wer": 0.36010177535092486, + "step": 27960 + }, + { + "epoch": 4.14, + "learning_rate": 7.959940652818991e-06, + "loss": 1.1652, + "step": 28000 + }, + { + "epoch": 4.14, + "eval_loss": 1.0010384321212769, + "eval_runtime": 519.2647, + "eval_samples_per_second": 14.711, + "eval_wer": 0.3587581120100632, + "step": 28000 + }, + { + "epoch": 4.14, + "learning_rate": 7.956973293768546e-06, + "loss": 1.1072, + "step": 28040 + }, + { + "epoch": 4.14, + "eval_loss": 1.011716365814209, + "eval_runtime": 522.0844, + "eval_samples_per_second": 14.632, + "eval_wer": 0.3593584722261929, + "step": 28040 + }, + { + "epoch": 4.15, + "learning_rate": 7.954005934718102e-06, + "loss": 1.1238, + "step": 28080 + }, + { + "epoch": 4.15, + "eval_loss": 0.9536174535751343, + "eval_runtime": 518.0238, + "eval_samples_per_second": 14.746, + "eval_wer": 0.3556133680208125, + "step": 28080 + }, + { + "epoch": 4.16, + "learning_rate": 7.951038575667656e-06, + "loss": 1.1243, + "step": 28120 + }, + { + "epoch": 4.16, + "eval_loss": 1.032930612564087, + "eval_runtime": 520.2997, + "eval_samples_per_second": 14.682, + "eval_wer": 0.3613882615283456, + "step": 28120 + }, + { + "epoch": 4.16, + "learning_rate": 7.94807121661721e-06, + "loss": 1.0864, + "step": 28160 + }, + { + "epoch": 4.16, + "eval_loss": 0.9986640214920044, + "eval_runtime": 517.3061, + "eval_samples_per_second": 14.767, + "eval_wer": 0.3583864604476972, + "step": 28160 + }, + { + "epoch": 4.17, + "learning_rate": 7.945103857566765e-06, + "loss": 1.1517, + "step": 28200 + }, + { + "epoch": 4.17, + "eval_loss": 1.047798752784729, + "eval_runtime": 518.8813, + "eval_samples_per_second": 14.722, + "eval_wer": 0.3634752279939392, + "step": 28200 + }, + { + "epoch": 4.17, + "learning_rate": 7.942136498516321e-06, + "loss": 1.1402, + "step": 28240 + }, + { + "epoch": 4.17, + "eval_loss": 1.0599175691604614, + "eval_runtime": 516.8775, + "eval_samples_per_second": 14.779, + "eval_wer": 0.3641613539552303, + "step": 28240 + }, + { + "epoch": 4.18, + "learning_rate": 7.939169139465876e-06, + "loss": 1.099, + "step": 28280 + }, + { + "epoch": 4.18, + "eval_loss": 0.975063145160675, + "eval_runtime": 517.9477, + "eval_samples_per_second": 14.749, + "eval_wer": 0.3564710254724263, + "step": 28280 + }, + { + "epoch": 4.19, + "learning_rate": 7.936201780415432e-06, + "loss": 1.1013, + "step": 28320 + }, + { + "epoch": 4.19, + "eval_loss": 1.0289757251739502, + "eval_runtime": 518.4483, + "eval_samples_per_second": 14.734, + "eval_wer": 0.3607021355670545, + "step": 28320 + }, + { + "epoch": 4.19, + "learning_rate": 7.933234421364986e-06, + "loss": 1.0779, + "step": 28360 + }, + { + "epoch": 4.19, + "eval_loss": 1.0799386501312256, + "eval_runtime": 518.467, + "eval_samples_per_second": 14.734, + "eval_wer": 0.36484747991652133, + "step": 28360 + }, + { + "epoch": 4.2, + "learning_rate": 7.930267062314541e-06, + "loss": 1.1482, + "step": 28400 + }, + { + "epoch": 4.2, + "eval_loss": 1.001220464706421, + "eval_runtime": 521.9007, + "eval_samples_per_second": 14.637, + "eval_wer": 0.3585865805197404, + "step": 28400 + }, + { + "epoch": 4.2, + "learning_rate": 7.927299703264095e-06, + "loss": 1.0429, + "step": 28440 + }, + { + "epoch": 4.2, + "eval_loss": 1.0270240306854248, + "eval_runtime": 516.9554, + "eval_samples_per_second": 14.777, + "eval_wer": 0.3604734269132908, + "step": 28440 + }, + { + "epoch": 4.21, + "learning_rate": 7.924332344213651e-06, + "loss": 1.1327, + "step": 28480 + }, + { + "epoch": 4.21, + "eval_loss": 1.0136690139770508, + "eval_runtime": 516.6265, + "eval_samples_per_second": 14.786, + "eval_wer": 0.36058778124017266, + "step": 28480 + }, + { + "epoch": 4.22, + "learning_rate": 7.921364985163206e-06, + "loss": 0.9786, + "step": 28520 + }, + { + "epoch": 4.22, + "eval_loss": 1.0316003561019897, + "eval_runtime": 519.2902, + "eval_samples_per_second": 14.71, + "eval_wer": 0.3619028559993139, + "step": 28520 + }, + { + "epoch": 4.22, + "learning_rate": 7.91839762611276e-06, + "loss": 1.1752, + "step": 28560 + }, + { + "epoch": 4.22, + "eval_loss": 0.9914469122886658, + "eval_runtime": 517.3394, + "eval_samples_per_second": 14.766, + "eval_wer": 0.3584436376111381, + "step": 28560 + }, + { + "epoch": 4.23, + "learning_rate": 7.915430267062315e-06, + "loss": 1.0716, + "step": 28600 + }, + { + "epoch": 4.23, + "eval_loss": 1.0116994380950928, + "eval_runtime": 518.2534, + "eval_samples_per_second": 14.74, + "eval_wer": 0.3600445981874839, + "step": 28600 + }, + { + "epoch": 4.23, + "learning_rate": 7.91246290801187e-06, + "loss": 1.1068, + "step": 28640 + }, + { + "epoch": 4.23, + "eval_loss": 1.0334413051605225, + "eval_runtime": 517.4063, + "eval_samples_per_second": 14.764, + "eval_wer": 0.3616741473455502, + "step": 28640 + }, + { + "epoch": 4.24, + "learning_rate": 7.909495548961424e-06, + "loss": 1.1383, + "step": 28680 + }, + { + "epoch": 4.24, + "eval_loss": 1.0094255208969116, + "eval_runtime": 517.665, + "eval_samples_per_second": 14.757, + "eval_wer": 0.3594442379713542, + "step": 28680 + }, + { + "epoch": 4.25, + "learning_rate": 7.90652818991098e-06, + "loss": 1.1254, + "step": 28720 + }, + { + "epoch": 4.25, + "eval_loss": 1.0347013473510742, + "eval_runtime": 516.4491, + "eval_samples_per_second": 14.791, + "eval_wer": 0.3601303639326453, + "step": 28720 + }, + { + "epoch": 4.25, + "learning_rate": 7.903560830860534e-06, + "loss": 1.1439, + "step": 28760 + }, + { + "epoch": 4.25, + "eval_loss": 0.9980185031890869, + "eval_runtime": 516.7521, + "eval_samples_per_second": 14.783, + "eval_wer": 0.3579004545584494, + "step": 28760 + }, + { + "epoch": 4.26, + "learning_rate": 7.90059347181009e-06, + "loss": 1.102, + "step": 28800 + }, + { + "epoch": 4.26, + "eval_loss": 1.0123798847198486, + "eval_runtime": 516.4979, + "eval_samples_per_second": 14.79, + "eval_wer": 0.3587581120100632, + "step": 28800 + }, + { + "epoch": 4.26, + "learning_rate": 7.897626112759645e-06, + "loss": 1.1852, + "step": 28840 + }, + { + "epoch": 4.26, + "eval_loss": 0.9986881017684937, + "eval_runtime": 518.2511, + "eval_samples_per_second": 14.74, + "eval_wer": 0.35804339746705166, + "step": 28840 + }, + { + "epoch": 4.27, + "learning_rate": 7.8946587537092e-06, + "loss": 1.1285, + "step": 28880 + }, + { + "epoch": 4.27, + "eval_loss": 1.0426254272460938, + "eval_runtime": 517.5396, + "eval_samples_per_second": 14.76, + "eval_wer": 0.36053060407673176, + "step": 28880 + }, + { + "epoch": 4.27, + "learning_rate": 7.891691394658755e-06, + "loss": 1.1617, + "step": 28920 + }, + { + "epoch": 4.27, + "eval_loss": 0.9496119022369385, + "eval_runtime": 517.2171, + "eval_samples_per_second": 14.769, + "eval_wer": 0.3553560707853283, + "step": 28920 + }, + { + "epoch": 4.28, + "learning_rate": 7.88872403560831e-06, + "loss": 1.1588, + "step": 28960 + }, + { + "epoch": 4.28, + "eval_loss": 0.9806321263313293, + "eval_runtime": 515.743, + "eval_samples_per_second": 14.812, + "eval_wer": 0.3566425569627491, + "step": 28960 + }, + { + "epoch": 4.29, + "learning_rate": 7.885756676557864e-06, + "loss": 1.1951, + "step": 29000 + }, + { + "epoch": 4.29, + "eval_loss": 0.9549854397773743, + "eval_runtime": 521.1307, + "eval_samples_per_second": 14.659, + "eval_wer": 0.355584779439092, + "step": 29000 + }, + { + "epoch": 4.29, + "learning_rate": 7.882789317507419e-06, + "loss": 1.0964, + "step": 29040 + }, + { + "epoch": 4.29, + "eval_loss": 1.0674152374267578, + "eval_runtime": 517.4999, + "eval_samples_per_second": 14.761, + "eval_wer": 0.3646473598444781, + "step": 29040 + }, + { + "epoch": 4.3, + "learning_rate": 7.879821958456973e-06, + "loss": 1.031, + "step": 29080 + }, + { + "epoch": 4.3, + "eval_loss": 1.0076794624328613, + "eval_runtime": 517.0056, + "eval_samples_per_second": 14.775, + "eval_wer": 0.35967294662511795, + "step": 29080 + }, + { + "epoch": 4.3, + "learning_rate": 7.87685459940653e-06, + "loss": 1.089, + "step": 29120 + }, + { + "epoch": 4.3, + "eval_loss": 1.0496057271957397, + "eval_runtime": 521.1749, + "eval_samples_per_second": 14.657, + "eval_wer": 0.36204579890791616, + "step": 29120 + }, + { + "epoch": 4.31, + "learning_rate": 7.873887240356084e-06, + "loss": 1.1002, + "step": 29160 + }, + { + "epoch": 4.31, + "eval_loss": 1.0502471923828125, + "eval_runtime": 515.8059, + "eval_samples_per_second": 14.81, + "eval_wer": 0.36247462763372307, + "step": 29160 + }, + { + "epoch": 4.32, + "learning_rate": 7.870919881305638e-06, + "loss": 1.1155, + "step": 29200 + }, + { + "epoch": 4.32, + "eval_loss": 1.0315710306167603, + "eval_runtime": 516.5437, + "eval_samples_per_second": 14.789, + "eval_wer": 0.3614454386917865, + "step": 29200 + }, + { + "epoch": 4.32, + "learning_rate": 7.867952522255193e-06, + "loss": 1.1446, + "step": 29240 + }, + { + "epoch": 4.32, + "eval_loss": 0.9778415560722351, + "eval_runtime": 521.6085, + "eval_samples_per_second": 14.645, + "eval_wer": 0.3573572715057606, + "step": 29240 + }, + { + "epoch": 4.33, + "learning_rate": 7.864985163204749e-06, + "loss": 1.1135, + "step": 29280 + }, + { + "epoch": 4.33, + "eval_loss": 1.0328408479690552, + "eval_runtime": 517.1669, + "eval_samples_per_second": 14.771, + "eval_wer": 0.360730724148775, + "step": 29280 + }, + { + "epoch": 4.33, + "learning_rate": 7.862017804154303e-06, + "loss": 1.0609, + "step": 29320 + }, + { + "epoch": 4.33, + "eval_loss": 1.0222322940826416, + "eval_runtime": 516.4114, + "eval_samples_per_second": 14.792, + "eval_wer": 0.3599016552788816, + "step": 29320 + }, + { + "epoch": 4.34, + "learning_rate": 7.85905044510386e-06, + "loss": 1.0595, + "step": 29360 + }, + { + "epoch": 4.34, + "eval_loss": 1.060978889465332, + "eval_runtime": 518.0062, + "eval_samples_per_second": 14.747, + "eval_wer": 0.36256039337888446, + "step": 29360 + }, + { + "epoch": 4.35, + "learning_rate": 7.856083086053414e-06, + "loss": 1.0765, + "step": 29400 + }, + { + "epoch": 4.35, + "eval_loss": 0.9978111386299133, + "eval_runtime": 515.8557, + "eval_samples_per_second": 14.808, + "eval_wer": 0.3573858600874811, + "step": 29400 + }, + { + "epoch": 4.35, + "learning_rate": 7.853115727002968e-06, + "loss": 1.1555, + "step": 29440 + }, + { + "epoch": 4.35, + "eval_loss": 1.0090408325195312, + "eval_runtime": 517.6938, + "eval_samples_per_second": 14.756, + "eval_wer": 0.35864375768318135, + "step": 29440 + }, + { + "epoch": 4.36, + "learning_rate": 7.850148367952523e-06, + "loss": 1.0493, + "step": 29480 + }, + { + "epoch": 4.36, + "eval_loss": 1.030698537826538, + "eval_runtime": 517.465, + "eval_samples_per_second": 14.762, + "eval_wer": 0.35950141513479517, + "step": 29480 + }, + { + "epoch": 4.36, + "learning_rate": 7.847181008902079e-06, + "loss": 1.0423, + "step": 29520 + }, + { + "epoch": 4.36, + "eval_loss": 1.0564556121826172, + "eval_runtime": 516.5388, + "eval_samples_per_second": 14.789, + "eval_wer": 0.3612453186197433, + "step": 29520 + }, + { + "epoch": 4.37, + "learning_rate": 7.844213649851633e-06, + "loss": 1.0956, + "step": 29560 + }, + { + "epoch": 4.37, + "eval_loss": 1.0114264488220215, + "eval_runtime": 517.4486, + "eval_samples_per_second": 14.763, + "eval_wer": 0.35775751164984704, + "step": 29560 + }, + { + "epoch": 4.38, + "learning_rate": 7.841246290801188e-06, + "loss": 1.1461, + "step": 29600 + }, + { + "epoch": 4.38, + "eval_loss": 1.0158805847167969, + "eval_runtime": 516.2548, + "eval_samples_per_second": 14.797, + "eval_wer": 0.35847222619285857, + "step": 29600 + }, + { + "epoch": 4.38, + "learning_rate": 7.838278931750742e-06, + "loss": 1.0789, + "step": 29640 + }, + { + "epoch": 4.38, + "eval_loss": 1.0107299089431763, + "eval_runtime": 520.4911, + "eval_samples_per_second": 14.677, + "eval_wer": 0.3580148088853312, + "step": 29640 + }, + { + "epoch": 4.39, + "learning_rate": 7.835311572700297e-06, + "loss": 1.1028, + "step": 29680 + }, + { + "epoch": 4.39, + "eval_loss": 1.0288488864898682, + "eval_runtime": 518.8712, + "eval_samples_per_second": 14.722, + "eval_wer": 0.359244117899311, + "step": 29680 + }, + { + "epoch": 4.39, + "learning_rate": 7.832344213649851e-06, + "loss": 1.1296, + "step": 29720 + }, + { + "epoch": 4.39, + "eval_loss": 1.0198644399642944, + "eval_runtime": 518.148, + "eval_samples_per_second": 14.743, + "eval_wer": 0.35847222619285857, + "step": 29720 + }, + { + "epoch": 4.4, + "learning_rate": 7.829376854599407e-06, + "loss": 1.1488, + "step": 29760 + }, + { + "epoch": 4.4, + "eval_loss": 0.9756755232810974, + "eval_runtime": 517.0045, + "eval_samples_per_second": 14.775, + "eval_wer": 0.3558420766745762, + "step": 29760 + }, + { + "epoch": 4.4, + "learning_rate": 7.826409495548962e-06, + "loss": 1.1375, + "step": 29800 + }, + { + "epoch": 4.4, + "eval_loss": 0.9799306988716125, + "eval_runtime": 517.1833, + "eval_samples_per_second": 14.77, + "eval_wer": 0.35578489951113523, + "step": 29800 + }, + { + "epoch": 4.41, + "learning_rate": 7.823442136498518e-06, + "loss": 1.1562, + "step": 29840 + }, + { + "epoch": 4.41, + "eval_loss": 0.9705556035041809, + "eval_runtime": 516.846, + "eval_samples_per_second": 14.78, + "eval_wer": 0.35512736213156465, + "step": 29840 + }, + { + "epoch": 4.42, + "learning_rate": 7.820474777448072e-06, + "loss": 1.1221, + "step": 29880 + }, + { + "epoch": 4.42, + "eval_loss": 1.0063995122909546, + "eval_runtime": 517.4176, + "eval_samples_per_second": 14.764, + "eval_wer": 0.357814688813288, + "step": 29880 + }, + { + "epoch": 4.42, + "learning_rate": 7.817507418397627e-06, + "loss": 1.0836, + "step": 29920 + }, + { + "epoch": 4.42, + "eval_loss": 1.0277222394943237, + "eval_runtime": 518.0562, + "eval_samples_per_second": 14.746, + "eval_wer": 0.3592727064810315, + "step": 29920 + }, + { + "epoch": 4.43, + "learning_rate": 7.814540059347183e-06, + "loss": 1.0175, + "step": 29960 + }, + { + "epoch": 4.43, + "eval_loss": 1.0113905668258667, + "eval_runtime": 517.4431, + "eval_samples_per_second": 14.763, + "eval_wer": 0.357071385688556, + "step": 29960 + }, + { + "epoch": 4.43, + "learning_rate": 7.811572700296737e-06, + "loss": 1.0851, + "step": 30000 + }, + { + "epoch": 4.43, + "eval_loss": 1.0244808197021484, + "eval_runtime": 516.1022, + "eval_samples_per_second": 14.801, + "eval_wer": 0.35795763172189027, + "step": 30000 + }, + { + "epoch": 4.44, + "learning_rate": 7.808605341246292e-06, + "loss": 1.0833, + "step": 30040 + }, + { + "epoch": 4.44, + "eval_loss": 0.999613344669342, + "eval_runtime": 516.4423, + "eval_samples_per_second": 14.792, + "eval_wer": 0.35581348809285573, + "step": 30040 + }, + { + "epoch": 4.45, + "learning_rate": 7.805637982195846e-06, + "loss": 1.0666, + "step": 30080 + }, + { + "epoch": 4.45, + "eval_loss": 1.0297757387161255, + "eval_runtime": 517.3575, + "eval_samples_per_second": 14.765, + "eval_wer": 0.3593298836444724, + "step": 30080 + }, + { + "epoch": 4.45, + "learning_rate": 7.8026706231454e-06, + "loss": 1.0936, + "step": 30120 + }, + { + "epoch": 4.45, + "eval_loss": 1.003629446029663, + "eval_runtime": 516.1094, + "eval_samples_per_second": 14.801, + "eval_wer": 0.3574144486692015, + "step": 30120 + }, + { + "epoch": 4.46, + "learning_rate": 7.799703264094957e-06, + "loss": 0.9889, + "step": 30160 + }, + { + "epoch": 4.46, + "eval_loss": 1.0651980638504028, + "eval_runtime": 517.6137, + "eval_samples_per_second": 14.758, + "eval_wer": 0.36187426741759343, + "step": 30160 + }, + { + "epoch": 4.46, + "learning_rate": 7.796735905044511e-06, + "loss": 1.1972, + "step": 30200 + }, + { + "epoch": 4.46, + "eval_loss": 0.9757182002067566, + "eval_runtime": 517.414, + "eval_samples_per_second": 14.764, + "eval_wer": 0.35409817318962805, + "step": 30200 + }, + { + "epoch": 4.47, + "learning_rate": 7.793768545994066e-06, + "loss": 1.0669, + "step": 30240 + }, + { + "epoch": 4.47, + "eval_loss": 1.0498521327972412, + "eval_runtime": 516.6179, + "eval_samples_per_second": 14.787, + "eval_wer": 0.3599588324423225, + "step": 30240 + }, + { + "epoch": 4.48, + "learning_rate": 7.79080118694362e-06, + "loss": 1.1443, + "step": 30280 + }, + { + "epoch": 4.48, + "eval_loss": 1.0508592128753662, + "eval_runtime": 517.5374, + "eval_samples_per_second": 14.76, + "eval_wer": 0.3608164898939364, + "step": 30280 + }, + { + "epoch": 4.48, + "learning_rate": 7.787833827893176e-06, + "loss": 1.0988, + "step": 30320 + }, + { + "epoch": 4.48, + "eval_loss": 1.0634363889694214, + "eval_runtime": 517.233, + "eval_samples_per_second": 14.769, + "eval_wer": 0.3622745075616799, + "step": 30320 + }, + { + "epoch": 4.49, + "learning_rate": 7.78486646884273e-06, + "loss": 1.0449, + "step": 30360 + }, + { + "epoch": 4.49, + "eval_loss": 1.023804783821106, + "eval_runtime": 517.0027, + "eval_samples_per_second": 14.776, + "eval_wer": 0.3590154092455473, + "step": 30360 + }, + { + "epoch": 4.49, + "learning_rate": 7.781899109792285e-06, + "loss": 1.0463, + "step": 30400 + }, + { + "epoch": 4.49, + "eval_loss": 1.0637210607528687, + "eval_runtime": 517.9872, + "eval_samples_per_second": 14.747, + "eval_wer": 0.36258898196060496, + "step": 30400 + }, + { + "epoch": 4.5, + "learning_rate": 7.778931750741841e-06, + "loss": 1.1166, + "step": 30440 + }, + { + "epoch": 4.5, + "eval_loss": 1.0437933206558228, + "eval_runtime": 516.9748, + "eval_samples_per_second": 14.776, + "eval_wer": 0.36033048400468853, + "step": 30440 + }, + { + "epoch": 4.51, + "learning_rate": 7.775964391691396e-06, + "loss": 1.0791, + "step": 30480 + }, + { + "epoch": 4.51, + "eval_loss": 1.0555959939956665, + "eval_runtime": 518.0493, + "eval_samples_per_second": 14.746, + "eval_wer": 0.3613024957831842, + "step": 30480 + }, + { + "epoch": 4.51, + "learning_rate": 7.77299703264095e-06, + "loss": 1.1144, + "step": 30520 + }, + { + "epoch": 4.51, + "eval_loss": 0.9781954884529114, + "eval_runtime": 517.2771, + "eval_samples_per_second": 14.768, + "eval_wer": 0.3538694645358644, + "step": 30520 + }, + { + "epoch": 4.52, + "learning_rate": 7.770029673590506e-06, + "loss": 1.173, + "step": 30560 + }, + { + "epoch": 4.52, + "eval_loss": 1.0083729028701782, + "eval_runtime": 517.959, + "eval_samples_per_second": 14.748, + "eval_wer": 0.35644243689070587, + "step": 30560 + }, + { + "epoch": 4.52, + "learning_rate": 7.76706231454006e-06, + "loss": 1.0592, + "step": 30600 + }, + { + "epoch": 4.52, + "eval_loss": 1.0010157823562622, + "eval_runtime": 517.3242, + "eval_samples_per_second": 14.766, + "eval_wer": 0.3560421967466194, + "step": 30600 + }, + { + "epoch": 4.53, + "learning_rate": 7.764094955489615e-06, + "loss": 1.1112, + "step": 30640 + }, + { + "epoch": 4.53, + "eval_loss": 0.9720462560653687, + "eval_runtime": 516.3134, + "eval_samples_per_second": 14.795, + "eval_wer": 0.3535549901369393, + "step": 30640 + }, + { + "epoch": 4.54, + "learning_rate": 7.76112759643917e-06, + "loss": 1.1414, + "step": 30680 + }, + { + "epoch": 4.54, + "eval_loss": 1.0112695693969727, + "eval_runtime": 515.9933, + "eval_samples_per_second": 14.804, + "eval_wer": 0.3561279624917808, + "step": 30680 + }, + { + "epoch": 4.54, + "learning_rate": 7.758160237388724e-06, + "loss": 1.1854, + "step": 30720 + }, + { + "epoch": 4.54, + "eval_loss": 0.9933329820632935, + "eval_runtime": 517.1947, + "eval_samples_per_second": 14.77, + "eval_wer": 0.35572772234769434, + "step": 30720 + }, + { + "epoch": 4.55, + "learning_rate": 7.755192878338278e-06, + "loss": 1.1359, + "step": 30760 + }, + { + "epoch": 4.55, + "eval_loss": 1.0201855897903442, + "eval_runtime": 516.2947, + "eval_samples_per_second": 14.796, + "eval_wer": 0.3579862203036107, + "step": 30760 + }, + { + "epoch": 4.55, + "learning_rate": 7.752225519287835e-06, + "loss": 1.1696, + "step": 30800 + }, + { + "epoch": 4.55, + "eval_loss": 1.034751534461975, + "eval_runtime": 516.8508, + "eval_samples_per_second": 14.78, + "eval_wer": 0.3597015352068384, + "step": 30800 + }, + { + "epoch": 4.56, + "learning_rate": 7.749258160237389e-06, + "loss": 1.0976, + "step": 30840 + }, + { + "epoch": 4.56, + "eval_loss": 1.0100444555282593, + "eval_runtime": 517.8818, + "eval_samples_per_second": 14.75, + "eval_wer": 0.3572143285971583, + "step": 30840 + }, + { + "epoch": 4.56, + "learning_rate": 7.746290801186943e-06, + "loss": 1.0788, + "step": 30880 + }, + { + "epoch": 4.56, + "eval_loss": 1.0287071466445923, + "eval_runtime": 516.2731, + "eval_samples_per_second": 14.796, + "eval_wer": 0.3583864604476972, + "step": 30880 + }, + { + "epoch": 4.57, + "learning_rate": 7.7433234421365e-06, + "loss": 1.0529, + "step": 30920 + }, + { + "epoch": 4.57, + "eval_loss": 1.0133593082427979, + "eval_runtime": 517.7416, + "eval_samples_per_second": 14.754, + "eval_wer": 0.35692844277995367, + "step": 30920 + }, + { + "epoch": 4.58, + "learning_rate": 7.740356083086054e-06, + "loss": 1.0638, + "step": 30960 + }, + { + "epoch": 4.58, + "eval_loss": 0.9609493613243103, + "eval_runtime": 519.5329, + "eval_samples_per_second": 14.704, + "eval_wer": 0.35361216730038025, + "step": 30960 + }, + { + "epoch": 4.58, + "learning_rate": 7.73738872403561e-06, + "loss": 1.0681, + "step": 31000 + }, + { + "epoch": 4.58, + "eval_loss": 1.0388981103897095, + "eval_runtime": 518.2567, + "eval_samples_per_second": 14.74, + "eval_wer": 0.35967294662511795, + "step": 31000 + }, + { + "epoch": 4.59, + "learning_rate": 7.734421364985165e-06, + "loss": 1.0955, + "step": 31040 + }, + { + "epoch": 4.59, + "eval_loss": 1.0028871297836304, + "eval_runtime": 518.0873, + "eval_samples_per_second": 14.745, + "eval_wer": 0.3566139683810286, + "step": 31040 + }, + { + "epoch": 4.59, + "learning_rate": 7.731454005934719e-06, + "loss": 1.1033, + "step": 31080 + }, + { + "epoch": 4.59, + "eval_loss": 0.999845564365387, + "eval_runtime": 517.9017, + "eval_samples_per_second": 14.75, + "eval_wer": 0.35607078532833986, + "step": 31080 + }, + { + "epoch": 4.6, + "learning_rate": 7.728486646884273e-06, + "loss": 1.067, + "step": 31120 + }, + { + "epoch": 4.6, + "eval_loss": 0.9884674549102783, + "eval_runtime": 517.6541, + "eval_samples_per_second": 14.757, + "eval_wer": 0.3551559507132851, + "step": 31120 + }, + { + "epoch": 4.61, + "learning_rate": 7.725519287833828e-06, + "loss": 1.0986, + "step": 31160 + }, + { + "epoch": 4.61, + "eval_loss": 1.0283485651016235, + "eval_runtime": 522.1804, + "eval_samples_per_second": 14.629, + "eval_wer": 0.35761456874124475, + "step": 31160 + }, + { + "epoch": 4.61, + "learning_rate": 7.722551928783384e-06, + "loss": 1.0534, + "step": 31200 + }, + { + "epoch": 4.61, + "eval_loss": 1.0018260478973389, + "eval_runtime": 516.4671, + "eval_samples_per_second": 14.791, + "eval_wer": 0.3552417164584465, + "step": 31200 + }, + { + "epoch": 4.62, + "learning_rate": 7.719584569732938e-06, + "loss": 1.0948, + "step": 31240 + }, + { + "epoch": 4.62, + "eval_loss": 0.9848181009292603, + "eval_runtime": 517.7057, + "eval_samples_per_second": 14.755, + "eval_wer": 0.3544126475885531, + "step": 31240 + }, + { + "epoch": 4.62, + "learning_rate": 7.716617210682493e-06, + "loss": 1.1177, + "step": 31280 + }, + { + "epoch": 4.62, + "eval_loss": 1.0045942068099976, + "eval_runtime": 521.9703, + "eval_samples_per_second": 14.635, + "eval_wer": 0.3558420766745762, + "step": 31280 + }, + { + "epoch": 4.63, + "learning_rate": 7.713649851632047e-06, + "loss": 1.0985, + "step": 31320 + }, + { + "epoch": 4.63, + "eval_loss": 0.9957672357559204, + "eval_runtime": 518.2546, + "eval_samples_per_second": 14.74, + "eval_wer": 0.3554132479487693, + "step": 31320 + }, + { + "epoch": 4.64, + "learning_rate": 7.710682492581602e-06, + "loss": 1.0716, + "step": 31360 + }, + { + "epoch": 4.64, + "eval_loss": 1.011922001838684, + "eval_runtime": 516.4244, + "eval_samples_per_second": 14.792, + "eval_wer": 0.3556991337659739, + "step": 31360 + }, + { + "epoch": 4.64, + "learning_rate": 7.707715133531158e-06, + "loss": 1.2422, + "step": 31400 + }, + { + "epoch": 4.64, + "eval_loss": 0.9752572774887085, + "eval_runtime": 521.3156, + "eval_samples_per_second": 14.653, + "eval_wer": 0.3537265216272621, + "step": 31400 + }, + { + "epoch": 4.65, + "learning_rate": 7.704747774480712e-06, + "loss": 1.1284, + "step": 31440 + }, + { + "epoch": 4.65, + "eval_loss": 1.0148875713348389, + "eval_runtime": 517.0206, + "eval_samples_per_second": 14.775, + "eval_wer": 0.3561279624917808, + "step": 31440 + }, + { + "epoch": 4.65, + "learning_rate": 7.701780415430268e-06, + "loss": 1.0564, + "step": 31480 + }, + { + "epoch": 4.65, + "eval_loss": 1.0123984813690186, + "eval_runtime": 517.5035, + "eval_samples_per_second": 14.761, + "eval_wer": 0.3557563109294148, + "step": 31480 + }, + { + "epoch": 4.66, + "learning_rate": 7.698813056379823e-06, + "loss": 1.1313, + "step": 31520 + }, + { + "epoch": 4.66, + "eval_loss": 1.0213305950164795, + "eval_runtime": 520.4882, + "eval_samples_per_second": 14.677, + "eval_wer": 0.35641384830898537, + "step": 31520 + }, + { + "epoch": 4.67, + "learning_rate": 7.695845697329377e-06, + "loss": 1.0557, + "step": 31560 + }, + { + "epoch": 4.67, + "eval_loss": 1.0263334512710571, + "eval_runtime": 517.9444, + "eval_samples_per_second": 14.749, + "eval_wer": 0.35644243689070587, + "step": 31560 + }, + { + "epoch": 4.67, + "learning_rate": 7.692878338278934e-06, + "loss": 1.1172, + "step": 31600 + }, + { + "epoch": 4.67, + "eval_loss": 0.9623167514801025, + "eval_runtime": 517.1379, + "eval_samples_per_second": 14.772, + "eval_wer": 0.3527545098487664, + "step": 31600 + }, + { + "epoch": 4.68, + "learning_rate": 7.689910979228488e-06, + "loss": 1.0795, + "step": 31640 + }, + { + "epoch": 4.68, + "eval_loss": 1.003406047821045, + "eval_runtime": 521.2625, + "eval_samples_per_second": 14.655, + "eval_wer": 0.35446982475199407, + "step": 31640 + }, + { + "epoch": 4.68, + "learning_rate": 7.686943620178042e-06, + "loss": 1.0872, + "step": 31680 + }, + { + "epoch": 4.68, + "eval_loss": 0.9968051314353943, + "eval_runtime": 516.0246, + "eval_samples_per_second": 14.804, + "eval_wer": 0.354155350353069, + "step": 31680 + }, + { + "epoch": 4.69, + "learning_rate": 7.683976261127597e-06, + "loss": 1.1128, + "step": 31720 + }, + { + "epoch": 4.69, + "eval_loss": 0.9959412217140198, + "eval_runtime": 515.9306, + "eval_samples_per_second": 14.806, + "eval_wer": 0.353783698790703, + "step": 31720 + }, + { + "epoch": 4.69, + "learning_rate": 7.681008902077151e-06, + "loss": 1.1043, + "step": 31760 + }, + { + "epoch": 4.69, + "eval_loss": 1.0409866571426392, + "eval_runtime": 522.1248, + "eval_samples_per_second": 14.631, + "eval_wer": 0.3567854998713514, + "step": 31760 + }, + { + "epoch": 4.7, + "learning_rate": 7.678041543026706e-06, + "loss": 1.0141, + "step": 31800 + }, + { + "epoch": 4.7, + "eval_loss": 1.1120960712432861, + "eval_runtime": 516.1145, + "eval_samples_per_second": 14.801, + "eval_wer": 0.363275107921896, + "step": 31800 + }, + { + "epoch": 4.71, + "learning_rate": 7.675074183976262e-06, + "loss": 1.0606, + "step": 31840 + }, + { + "epoch": 4.71, + "eval_loss": 0.9807072877883911, + "eval_runtime": 516.6487, + "eval_samples_per_second": 14.786, + "eval_wer": 0.3536407558821007, + "step": 31840 + }, + { + "epoch": 4.71, + "learning_rate": 7.672106824925816e-06, + "loss": 1.0384, + "step": 31880 + }, + { + "epoch": 4.71, + "eval_loss": 1.019762396812439, + "eval_runtime": 516.6847, + "eval_samples_per_second": 14.785, + "eval_wer": 0.35549901369393067, + "step": 31880 + }, + { + "epoch": 4.72, + "learning_rate": 7.66913946587537e-06, + "loss": 1.2044, + "step": 31920 + }, + { + "epoch": 4.72, + "eval_loss": 1.0829719305038452, + "eval_runtime": 516.4036, + "eval_samples_per_second": 14.793, + "eval_wer": 0.3601303639326453, + "step": 31920 + }, + { + "epoch": 4.72, + "learning_rate": 7.666172106824927e-06, + "loss": 1.1003, + "step": 31960 + }, + { + "epoch": 4.72, + "eval_loss": 1.0458056926727295, + "eval_runtime": 517.1295, + "eval_samples_per_second": 14.772, + "eval_wer": 0.35632808256382403, + "step": 31960 + }, + { + "epoch": 4.73, + "learning_rate": 7.663204747774481e-06, + "loss": 1.0583, + "step": 32000 + }, + { + "epoch": 4.73, + "eval_loss": 1.0052728652954102, + "eval_runtime": 518.4158, + "eval_samples_per_second": 14.735, + "eval_wer": 0.3544126475885531, + "step": 32000 + }, + { + "epoch": 4.74, + "learning_rate": 7.660237388724037e-06, + "loss": 1.1035, + "step": 32040 + }, + { + "epoch": 4.74, + "eval_loss": 1.0495153665542603, + "eval_runtime": 519.1761, + "eval_samples_per_second": 14.714, + "eval_wer": 0.3577289230681266, + "step": 32040 + }, + { + "epoch": 4.74, + "learning_rate": 7.657270029673592e-06, + "loss": 1.0275, + "step": 32080 + }, + { + "epoch": 4.74, + "eval_loss": 1.0074541568756104, + "eval_runtime": 517.7065, + "eval_samples_per_second": 14.755, + "eval_wer": 0.35478429915091914, + "step": 32080 + }, + { + "epoch": 4.75, + "learning_rate": 7.654302670623146e-06, + "loss": 1.0965, + "step": 32120 + }, + { + "epoch": 4.75, + "eval_loss": 0.99263596534729, + "eval_runtime": 522.7703, + "eval_samples_per_second": 14.613, + "eval_wer": 0.35358357871865975, + "step": 32120 + }, + { + "epoch": 4.75, + "learning_rate": 7.6513353115727e-06, + "loss": 1.1279, + "step": 32160 + }, + { + "epoch": 4.75, + "eval_loss": 1.0111048221588135, + "eval_runtime": 517.1651, + "eval_samples_per_second": 14.771, + "eval_wer": 0.35644243689070587, + "step": 32160 + }, + { + "epoch": 4.76, + "learning_rate": 7.648367952522255e-06, + "loss": 1.1032, + "step": 32200 + }, + { + "epoch": 4.76, + "eval_loss": 0.9560060501098633, + "eval_runtime": 516.6076, + "eval_samples_per_second": 14.787, + "eval_wer": 0.3513250807627434, + "step": 32200 + }, + { + "epoch": 4.77, + "learning_rate": 7.645400593471811e-06, + "loss": 1.0675, + "step": 32240 + }, + { + "epoch": 4.77, + "eval_loss": 1.024018406867981, + "eval_runtime": 520.9914, + "eval_samples_per_second": 14.662, + "eval_wer": 0.357071385688556, + "step": 32240 + }, + { + "epoch": 4.77, + "learning_rate": 7.642433234421366e-06, + "loss": 1.0407, + "step": 32280 + }, + { + "epoch": 4.77, + "eval_loss": 1.0275917053222656, + "eval_runtime": 519.3263, + "eval_samples_per_second": 14.709, + "eval_wer": 0.3573000943423197, + "step": 32280 + }, + { + "epoch": 4.78, + "learning_rate": 7.63946587537092e-06, + "loss": 0.9898, + "step": 32320 + }, + { + "epoch": 4.78, + "eval_loss": 1.044189691543579, + "eval_runtime": 516.1462, + "eval_samples_per_second": 14.8, + "eval_wer": 0.35747162583264247, + "step": 32320 + }, + { + "epoch": 4.78, + "learning_rate": 7.636498516320475e-06, + "loss": 1.1029, + "step": 32360 + }, + { + "epoch": 4.78, + "eval_loss": 0.9918689131736755, + "eval_runtime": 516.9885, + "eval_samples_per_second": 14.776, + "eval_wer": 0.35366934446382114, + "step": 32360 + }, + { + "epoch": 4.79, + "learning_rate": 7.633531157270029e-06, + "loss": 1.0675, + "step": 32400 + }, + { + "epoch": 4.79, + "eval_loss": 1.0255684852600098, + "eval_runtime": 517.1673, + "eval_samples_per_second": 14.771, + "eval_wer": 0.35581348809285573, + "step": 32400 + }, + { + "epoch": 4.8, + "learning_rate": 7.630563798219585e-06, + "loss": 1.1733, + "step": 32440 + }, + { + "epoch": 4.8, + "eval_loss": 0.970380961894989, + "eval_runtime": 520.4114, + "eval_samples_per_second": 14.679, + "eval_wer": 0.3517253209068298, + "step": 32440 + }, + { + "epoch": 4.8, + "learning_rate": 7.6275964391691406e-06, + "loss": 1.0692, + "step": 32480 + }, + { + "epoch": 4.8, + "eval_loss": 0.9946648478507996, + "eval_runtime": 516.9027, + "eval_samples_per_second": 14.778, + "eval_wer": 0.35361216730038025, + "step": 32480 + }, + { + "epoch": 4.81, + "learning_rate": 7.624629080118695e-06, + "loss": 1.0652, + "step": 32520 + }, + { + "epoch": 4.81, + "eval_loss": 1.0429116487503052, + "eval_runtime": 516.8294, + "eval_samples_per_second": 14.781, + "eval_wer": 0.3579004545584494, + "step": 32520 + }, + { + "epoch": 4.81, + "learning_rate": 7.6216617210682494e-06, + "loss": 1.0722, + "step": 32560 + }, + { + "epoch": 4.81, + "eval_loss": 1.0226349830627441, + "eval_runtime": 520.1421, + "eval_samples_per_second": 14.686, + "eval_wer": 0.35621372823694214, + "step": 32560 + }, + { + "epoch": 4.82, + "learning_rate": 7.618694362017805e-06, + "loss": 1.001, + "step": 32600 + }, + { + "epoch": 4.82, + "eval_loss": 1.0740878582000732, + "eval_runtime": 517.9331, + "eval_samples_per_second": 14.749, + "eval_wer": 0.3607879013122159, + "step": 32600 + }, + { + "epoch": 4.82, + "learning_rate": 7.61572700296736e-06, + "loss": 1.1227, + "step": 32640 + }, + { + "epoch": 4.82, + "eval_loss": 1.0097804069519043, + "eval_runtime": 517.3761, + "eval_samples_per_second": 14.765, + "eval_wer": 0.35504159638640326, + "step": 32640 + }, + { + "epoch": 4.83, + "learning_rate": 7.612759643916915e-06, + "loss": 1.0728, + "step": 32680 + }, + { + "epoch": 4.83, + "eval_loss": 0.9862077236175537, + "eval_runtime": 517.4943, + "eval_samples_per_second": 14.762, + "eval_wer": 0.35281168701220733, + "step": 32680 + }, + { + "epoch": 4.84, + "learning_rate": 7.60979228486647e-06, + "loss": 1.1092, + "step": 32720 + }, + { + "epoch": 4.84, + "eval_loss": 1.0823612213134766, + "eval_runtime": 518.0224, + "eval_samples_per_second": 14.746, + "eval_wer": 0.3615883816003888, + "step": 32720 + }, + { + "epoch": 4.84, + "learning_rate": 7.606824925816024e-06, + "loss": 1.0822, + "step": 32760 + }, + { + "epoch": 4.84, + "eval_loss": 0.9846158623695374, + "eval_runtime": 517.9357, + "eval_samples_per_second": 14.749, + "eval_wer": 0.3528688641756482, + "step": 32760 + }, + { + "epoch": 4.85, + "learning_rate": 7.603857566765579e-06, + "loss": 1.1381, + "step": 32800 + }, + { + "epoch": 4.85, + "eval_loss": 1.0149192810058594, + "eval_runtime": 517.6612, + "eval_samples_per_second": 14.757, + "eval_wer": 0.35512736213156465, + "step": 32800 + }, + { + "epoch": 4.85, + "learning_rate": 7.600890207715134e-06, + "loss": 1.0117, + "step": 32840 + }, + { + "epoch": 4.85, + "eval_loss": 1.0800724029541016, + "eval_runtime": 517.5275, + "eval_samples_per_second": 14.761, + "eval_wer": 0.36155979301866836, + "step": 32840 + }, + { + "epoch": 4.86, + "learning_rate": 7.597922848664689e-06, + "loss": 1.0319, + "step": 32880 + }, + { + "epoch": 4.86, + "eval_loss": 1.0422158241271973, + "eval_runtime": 517.6273, + "eval_samples_per_second": 14.758, + "eval_wer": 0.3573858600874811, + "step": 32880 + }, + { + "epoch": 4.87, + "learning_rate": 7.5949554896142445e-06, + "loss": 1.1061, + "step": 32920 + }, + { + "epoch": 4.87, + "eval_loss": 1.017138957977295, + "eval_runtime": 518.306, + "eval_samples_per_second": 14.738, + "eval_wer": 0.35549901369393067, + "step": 32920 + }, + { + "epoch": 4.87, + "learning_rate": 7.591988130563799e-06, + "loss": 1.1504, + "step": 32960 + }, + { + "epoch": 4.87, + "eval_loss": 1.0248948335647583, + "eval_runtime": 517.9325, + "eval_samples_per_second": 14.749, + "eval_wer": 0.3558420766745762, + "step": 32960 + }, + { + "epoch": 4.88, + "learning_rate": 7.589020771513353e-06, + "loss": 1.057, + "step": 33000 + }, + { + "epoch": 4.88, + "eval_loss": 1.0437135696411133, + "eval_runtime": 519.0945, + "eval_samples_per_second": 14.716, + "eval_wer": 0.35747162583264247, + "step": 33000 + }, + { + "epoch": 4.88, + "learning_rate": 7.586053412462908e-06, + "loss": 1.088, + "step": 33040 + }, + { + "epoch": 4.88, + "eval_loss": 1.0432084798812866, + "eval_runtime": 517.2327, + "eval_samples_per_second": 14.769, + "eval_wer": 0.3567854998713514, + "step": 33040 + }, + { + "epoch": 4.89, + "learning_rate": 7.583086053412464e-06, + "loss": 1.0902, + "step": 33080 + }, + { + "epoch": 4.89, + "eval_loss": 1.0100305080413818, + "eval_runtime": 518.3354, + "eval_samples_per_second": 14.738, + "eval_wer": 0.3537265216272621, + "step": 33080 + }, + { + "epoch": 4.9, + "learning_rate": 7.580118694362018e-06, + "loss": 1.0758, + "step": 33120 + }, + { + "epoch": 4.9, + "eval_loss": 1.0062891244888306, + "eval_runtime": 518.7138, + "eval_samples_per_second": 14.727, + "eval_wer": 0.353783698790703, + "step": 33120 + }, + { + "epoch": 4.9, + "learning_rate": 7.577151335311574e-06, + "loss": 1.065, + "step": 33160 + }, + { + "epoch": 4.9, + "eval_loss": 0.9820078611373901, + "eval_runtime": 517.8333, + "eval_samples_per_second": 14.752, + "eval_wer": 0.3518682638154321, + "step": 33160 + }, + { + "epoch": 4.91, + "learning_rate": 7.574183976261128e-06, + "loss": 1.1387, + "step": 33200 + }, + { + "epoch": 4.91, + "eval_loss": 0.9775822758674622, + "eval_runtime": 517.6635, + "eval_samples_per_second": 14.757, + "eval_wer": 0.3514108465079047, + "step": 33200 + }, + { + "epoch": 4.91, + "learning_rate": 7.5712166172106826e-06, + "loss": 1.0457, + "step": 33240 + }, + { + "epoch": 4.91, + "eval_loss": 0.9870054125785828, + "eval_runtime": 517.176, + "eval_samples_per_second": 14.771, + "eval_wer": 0.35198261814231396, + "step": 33240 + }, + { + "epoch": 4.92, + "learning_rate": 7.568249258160239e-06, + "loss": 1.0943, + "step": 33280 + }, + { + "epoch": 4.92, + "eval_loss": 0.9566874504089355, + "eval_runtime": 518.2338, + "eval_samples_per_second": 14.74, + "eval_wer": 0.349381057205752, + "step": 33280 + }, + { + "epoch": 4.93, + "learning_rate": 7.565281899109793e-06, + "loss": 1.0756, + "step": 33320 + }, + { + "epoch": 4.93, + "eval_loss": 0.9976547956466675, + "eval_runtime": 517.1373, + "eval_samples_per_second": 14.772, + "eval_wer": 0.3532976929014552, + "step": 33320 + }, + { + "epoch": 4.93, + "learning_rate": 7.562314540059348e-06, + "loss": 1.0348, + "step": 33360 + }, + { + "epoch": 4.93, + "eval_loss": 1.0422464609146118, + "eval_runtime": 517.7359, + "eval_samples_per_second": 14.755, + "eval_wer": 0.3556133680208125, + "step": 33360 + }, + { + "epoch": 4.94, + "learning_rate": 7.559347181008903e-06, + "loss": 1.0744, + "step": 33400 + }, + { + "epoch": 4.94, + "eval_loss": 1.0295886993408203, + "eval_runtime": 517.5984, + "eval_samples_per_second": 14.759, + "eval_wer": 0.3558706652562966, + "step": 33400 + }, + { + "epoch": 4.94, + "learning_rate": 7.556379821958457e-06, + "loss": 1.1133, + "step": 33440 + }, + { + "epoch": 4.94, + "eval_loss": 0.9958652853965759, + "eval_runtime": 517.8939, + "eval_samples_per_second": 14.75, + "eval_wer": 0.35344063581005747, + "step": 33440 + }, + { + "epoch": 4.95, + "learning_rate": 7.553412462908013e-06, + "loss": 1.0646, + "step": 33480 + }, + { + "epoch": 4.95, + "eval_loss": 1.0233595371246338, + "eval_runtime": 518.8293, + "eval_samples_per_second": 14.724, + "eval_wer": 0.3547271219874782, + "step": 33480 + }, + { + "epoch": 4.95, + "learning_rate": 7.550445103857568e-06, + "loss": 1.0448, + "step": 33520 + }, + { + "epoch": 4.95, + "eval_loss": 1.0116307735443115, + "eval_runtime": 519.0116, + "eval_samples_per_second": 14.718, + "eval_wer": 0.354898653477801, + "step": 33520 + }, + { + "epoch": 4.96, + "learning_rate": 7.547477744807122e-06, + "loss": 1.0756, + "step": 33560 + }, + { + "epoch": 4.96, + "eval_loss": 1.0275923013687134, + "eval_runtime": 518.9864, + "eval_samples_per_second": 14.719, + "eval_wer": 0.3559278424197376, + "step": 33560 + }, + { + "epoch": 4.97, + "learning_rate": 7.544510385756677e-06, + "loss": 0.9846, + "step": 33600 + }, + { + "epoch": 4.97, + "eval_loss": 1.0057480335235596, + "eval_runtime": 518.0869, + "eval_samples_per_second": 14.745, + "eval_wer": 0.35418393893478944, + "step": 33600 + }, + { + "epoch": 4.97, + "learning_rate": 7.541543026706232e-06, + "loss": 1.0951, + "step": 33640 + }, + { + "epoch": 4.97, + "eval_loss": 0.9959642887115479, + "eval_runtime": 518.4246, + "eval_samples_per_second": 14.735, + "eval_wer": 0.35332628148317563, + "step": 33640 + }, + { + "epoch": 4.98, + "learning_rate": 7.538575667655787e-06, + "loss": 1.129, + "step": 33680 + }, + { + "epoch": 4.98, + "eval_loss": 1.0451074838638306, + "eval_runtime": 522.6829, + "eval_samples_per_second": 14.615, + "eval_wer": 0.35767174590468565, + "step": 33680 + }, + { + "epoch": 4.98, + "learning_rate": 7.535608308605342e-06, + "loss": 1.0386, + "step": 33720 + }, + { + "epoch": 4.98, + "eval_loss": 1.000087022781372, + "eval_runtime": 517.6784, + "eval_samples_per_second": 14.756, + "eval_wer": 0.35455559049715546, + "step": 33720 + }, + { + "epoch": 4.99, + "learning_rate": 7.532640949554897e-06, + "loss": 1.0854, + "step": 33760 + }, + { + "epoch": 4.99, + "eval_loss": 0.9991193413734436, + "eval_runtime": 518.3399, + "eval_samples_per_second": 14.737, + "eval_wer": 0.35475571056919863, + "step": 33760 + }, + { + "epoch": 5.0, + "learning_rate": 7.5296735905044515e-06, + "loss": 1.0553, + "step": 33800 + }, + { + "epoch": 5.0, + "eval_loss": 0.9953956007957458, + "eval_runtime": 521.9143, + "eval_samples_per_second": 14.637, + "eval_wer": 0.35469853340575774, + "step": 33800 + }, + { + "epoch": 5.0, + "learning_rate": 7.526706231454006e-06, + "loss": 1.1396, + "step": 33840 + }, + { + "epoch": 5.0, + "eval_loss": 0.941692590713501, + "eval_runtime": 515.6812, + "eval_samples_per_second": 14.813, + "eval_wer": 0.35103919494553876, + "step": 33840 + }, + { + "epoch": 5.01, + "learning_rate": 7.523738872403561e-06, + "loss": 1.1217, + "step": 33880 + }, + { + "epoch": 5.01, + "eval_loss": 0.9842426180839539, + "eval_runtime": 517.1135, + "eval_samples_per_second": 14.772, + "eval_wer": 0.3522399153777981, + "step": 33880 + }, + { + "epoch": 5.01, + "learning_rate": 7.5207715133531166e-06, + "loss": 1.0758, + "step": 33920 + }, + { + "epoch": 5.01, + "eval_loss": 0.9906590580940247, + "eval_runtime": 516.8193, + "eval_samples_per_second": 14.781, + "eval_wer": 0.35161096657994795, + "step": 33920 + }, + { + "epoch": 5.02, + "learning_rate": 7.517804154302671e-06, + "loss": 1.1043, + "step": 33960 + }, + { + "epoch": 5.02, + "eval_loss": 0.9971727132797241, + "eval_runtime": 517.3842, + "eval_samples_per_second": 14.765, + "eval_wer": 0.3522399153777981, + "step": 33960 + }, + { + "epoch": 5.03, + "learning_rate": 7.514836795252226e-06, + "loss": 0.9899, + "step": 34000 + }, + { + "epoch": 5.03, + "eval_loss": 1.0162479877471924, + "eval_runtime": 517.0801, + "eval_samples_per_second": 14.773, + "eval_wer": 0.3531833385745733, + "step": 34000 + }, + { + "epoch": 5.03, + "learning_rate": 7.511869436201781e-06, + "loss": 1.0572, + "step": 34040 + }, + { + "epoch": 5.03, + "eval_loss": 0.9946324229240417, + "eval_runtime": 517.7569, + "eval_samples_per_second": 14.754, + "eval_wer": 0.3513536693444638, + "step": 34040 + }, + { + "epoch": 5.04, + "learning_rate": 7.508902077151335e-06, + "loss": 1.0921, + "step": 34080 + }, + { + "epoch": 5.04, + "eval_loss": 1.0271638631820679, + "eval_runtime": 518.55, + "eval_samples_per_second": 14.731, + "eval_wer": 0.35332628148317563, + "step": 34080 + }, + { + "epoch": 5.04, + "learning_rate": 7.505934718100891e-06, + "loss": 1.1453, + "step": 34120 + }, + { + "epoch": 5.04, + "eval_loss": 0.9695628881454468, + "eval_runtime": 518.3995, + "eval_samples_per_second": 14.736, + "eval_wer": 0.3502958918208068, + "step": 34120 + }, + { + "epoch": 5.05, + "learning_rate": 7.502967359050446e-06, + "loss": 1.063, + "step": 34160 + }, + { + "epoch": 5.05, + "eval_loss": 0.9882568717002869, + "eval_runtime": 518.509, + "eval_samples_per_second": 14.733, + "eval_wer": 0.35043883472940907, + "step": 34160 + }, + { + "epoch": 5.06, + "learning_rate": 7.500000000000001e-06, + "loss": 1.1401, + "step": 34200 + }, + { + "epoch": 5.06, + "eval_loss": 0.9885753393173218, + "eval_runtime": 517.8913, + "eval_samples_per_second": 14.75, + "eval_wer": 0.3510106063638183, + "step": 34200 + }, + { + "epoch": 5.06, + "learning_rate": 7.4970326409495555e-06, + "loss": 0.9794, + "step": 34240 + }, + { + "epoch": 5.06, + "eval_loss": 1.0146777629852295, + "eval_runtime": 516.2923, + "eval_samples_per_second": 14.796, + "eval_wer": 0.3526115669401641, + "step": 34240 + }, + { + "epoch": 5.07, + "learning_rate": 7.49406528189911e-06, + "loss": 1.0487, + "step": 34280 + }, + { + "epoch": 5.07, + "eval_loss": 1.0674594640731812, + "eval_runtime": 517.2338, + "eval_samples_per_second": 14.769, + "eval_wer": 0.3569856199433946, + "step": 34280 + }, + { + "epoch": 5.07, + "learning_rate": 7.491097922848666e-06, + "loss": 1.0536, + "step": 34320 + }, + { + "epoch": 5.07, + "eval_loss": 1.0534114837646484, + "eval_runtime": 517.1946, + "eval_samples_per_second": 14.77, + "eval_wer": 0.35547042511221016, + "step": 34320 + }, + { + "epoch": 5.08, + "learning_rate": 7.4881305637982205e-06, + "loss": 1.1235, + "step": 34360 + }, + { + "epoch": 5.08, + "eval_loss": 0.9636272192001343, + "eval_runtime": 517.4714, + "eval_samples_per_second": 14.762, + "eval_wer": 0.35075330912833413, + "step": 34360 + }, + { + "epoch": 5.08, + "learning_rate": 7.485163204747775e-06, + "loss": 1.0312, + "step": 34400 + }, + { + "epoch": 5.08, + "eval_loss": 1.0136626958847046, + "eval_runtime": 517.7844, + "eval_samples_per_second": 14.753, + "eval_wer": 0.35229709254123903, + "step": 34400 + }, + { + "epoch": 5.09, + "learning_rate": 7.48219584569733e-06, + "loss": 1.0324, + "step": 34440 + }, + { + "epoch": 5.09, + "eval_loss": 1.0350545644760132, + "eval_runtime": 519.1542, + "eval_samples_per_second": 14.714, + "eval_wer": 0.3527830984304869, + "step": 34440 + }, + { + "epoch": 5.1, + "learning_rate": 7.479228486646885e-06, + "loss": 1.0169, + "step": 34480 + }, + { + "epoch": 5.1, + "eval_loss": 1.0412139892578125, + "eval_runtime": 517.9301, + "eval_samples_per_second": 14.749, + "eval_wer": 0.35395523028102577, + "step": 34480 + }, + { + "epoch": 5.1, + "learning_rate": 7.47626112759644e-06, + "loss": 1.1422, + "step": 34520 + }, + { + "epoch": 5.1, + "eval_loss": 0.9540519118309021, + "eval_runtime": 518.1075, + "eval_samples_per_second": 14.744, + "eval_wer": 0.3476371537208039, + "step": 34520 + }, + { + "epoch": 5.11, + "learning_rate": 7.473293768545995e-06, + "loss": 1.0446, + "step": 34560 + }, + { + "epoch": 5.11, + "eval_loss": 1.0365962982177734, + "eval_runtime": 518.3603, + "eval_samples_per_second": 14.737, + "eval_wer": 0.3527545098487664, + "step": 34560 + }, + { + "epoch": 5.11, + "learning_rate": 7.47032640949555e-06, + "loss": 1.0254, + "step": 34600 + }, + { + "epoch": 5.11, + "eval_loss": 0.9772912859916687, + "eval_runtime": 518.9491, + "eval_samples_per_second": 14.72, + "eval_wer": 0.34975270876811804, + "step": 34600 + }, + { + "epoch": 5.12, + "learning_rate": 7.467359050445104e-06, + "loss": 1.0092, + "step": 34640 + }, + { + "epoch": 5.12, + "eval_loss": 1.043649673461914, + "eval_runtime": 517.8798, + "eval_samples_per_second": 14.751, + "eval_wer": 0.3537265216272621, + "step": 34640 + }, + { + "epoch": 5.13, + "learning_rate": 7.464391691394659e-06, + "loss": 1.0876, + "step": 34680 + }, + { + "epoch": 5.13, + "eval_loss": 0.9765923023223877, + "eval_runtime": 518.7418, + "eval_samples_per_second": 14.726, + "eval_wer": 0.34920952571542924, + "step": 34680 + }, + { + "epoch": 5.13, + "learning_rate": 7.461424332344214e-06, + "loss": 1.069, + "step": 34720 + }, + { + "epoch": 5.13, + "eval_loss": 0.9477208852767944, + "eval_runtime": 518.8334, + "eval_samples_per_second": 14.723, + "eval_wer": 0.3474942108122016, + "step": 34720 + }, + { + "epoch": 5.14, + "learning_rate": 7.458456973293769e-06, + "loss": 1.1168, + "step": 34760 + }, + { + "epoch": 5.14, + "eval_loss": 0.9617806077003479, + "eval_runtime": 517.7851, + "eval_samples_per_second": 14.753, + "eval_wer": 0.34760856513908345, + "step": 34760 + }, + { + "epoch": 5.14, + "learning_rate": 7.4554896142433244e-06, + "loss": 1.0914, + "step": 34800 + }, + { + "epoch": 5.14, + "eval_loss": 0.9582235813140869, + "eval_runtime": 518.163, + "eval_samples_per_second": 14.742, + "eval_wer": 0.34752279939392205, + "step": 34800 + }, + { + "epoch": 5.15, + "learning_rate": 7.452522255192879e-06, + "loss": 1.0557, + "step": 34840 + }, + { + "epoch": 5.15, + "eval_loss": 1.0293325185775757, + "eval_runtime": 517.7021, + "eval_samples_per_second": 14.756, + "eval_wer": 0.35258297835844365, + "step": 34840 + }, + { + "epoch": 5.16, + "learning_rate": 7.449554896142433e-06, + "loss": 1.0488, + "step": 34880 + }, + { + "epoch": 5.16, + "eval_loss": 0.9313080906867981, + "eval_runtime": 518.8983, + "eval_samples_per_second": 14.722, + "eval_wer": 0.3458646616541353, + "step": 34880 + }, + { + "epoch": 5.16, + "learning_rate": 7.446587537091989e-06, + "loss": 0.9922, + "step": 34920 + }, + { + "epoch": 5.16, + "eval_loss": 0.9609341621398926, + "eval_runtime": 518.2574, + "eval_samples_per_second": 14.74, + "eval_wer": 0.34723691357671743, + "step": 34920 + }, + { + "epoch": 5.17, + "learning_rate": 7.443620178041544e-06, + "loss": 0.9995, + "step": 34960 + }, + { + "epoch": 5.17, + "eval_loss": 0.9943296313285828, + "eval_runtime": 518.6736, + "eval_samples_per_second": 14.728, + "eval_wer": 0.35026730323908634, + "step": 34960 + }, + { + "epoch": 5.17, + "learning_rate": 7.440652818991098e-06, + "loss": 1.0805, + "step": 35000 + }, + { + "epoch": 5.17, + "eval_loss": 0.9770107865333557, + "eval_runtime": 518.9683, + "eval_samples_per_second": 14.72, + "eval_wer": 0.3495240001143543, + "step": 35000 + }, + { + "epoch": 5.18, + "learning_rate": 7.437685459940654e-06, + "loss": 0.9962, + "step": 35040 + }, + { + "epoch": 5.18, + "eval_loss": 1.0198523998260498, + "eval_runtime": 518.5574, + "eval_samples_per_second": 14.731, + "eval_wer": 0.35292604133908917, + "step": 35040 + }, + { + "epoch": 5.19, + "learning_rate": 7.434718100890208e-06, + "loss": 1.0321, + "step": 35080 + }, + { + "epoch": 5.19, + "eval_loss": 1.0129917860031128, + "eval_runtime": 519.8093, + "eval_samples_per_second": 14.696, + "eval_wer": 0.35349781297349836, + "step": 35080 + }, + { + "epoch": 5.19, + "learning_rate": 7.4317507418397625e-06, + "loss": 1.118, + "step": 35120 + }, + { + "epoch": 5.19, + "eval_loss": 1.0629512071609497, + "eval_runtime": 518.301, + "eval_samples_per_second": 14.739, + "eval_wer": 0.3574144486692015, + "step": 35120 + }, + { + "epoch": 5.2, + "learning_rate": 7.428783382789319e-06, + "loss": 1.0508, + "step": 35160 + }, + { + "epoch": 5.2, + "eval_loss": 1.0058223009109497, + "eval_runtime": 517.6207, + "eval_samples_per_second": 14.758, + "eval_wer": 0.3520969724691958, + "step": 35160 + }, + { + "epoch": 5.2, + "learning_rate": 7.425816023738873e-06, + "loss": 1.0045, + "step": 35200 + }, + { + "epoch": 5.2, + "eval_loss": 1.0579339265823364, + "eval_runtime": 518.1564, + "eval_samples_per_second": 14.743, + "eval_wer": 0.3568712656165128, + "step": 35200 + }, + { + "epoch": 5.21, + "learning_rate": 7.4228486646884275e-06, + "loss": 1.0443, + "step": 35240 + }, + { + "epoch": 5.21, + "eval_loss": 1.0330820083618164, + "eval_runtime": 523.5979, + "eval_samples_per_second": 14.589, + "eval_wer": 0.3536979330455416, + "step": 35240 + }, + { + "epoch": 5.22, + "learning_rate": 7.419881305637983e-06, + "loss": 1.0695, + "step": 35280 + }, + { + "epoch": 5.22, + "eval_loss": 0.953582763671875, + "eval_runtime": 519.6862, + "eval_samples_per_second": 14.699, + "eval_wer": 0.3482375139369336, + "step": 35280 + }, + { + "epoch": 5.22, + "learning_rate": 7.416913946587537e-06, + "loss": 1.0615, + "step": 35320 + }, + { + "epoch": 5.22, + "eval_loss": 1.001886248588562, + "eval_runtime": 519.2387, + "eval_samples_per_second": 14.712, + "eval_wer": 0.35075330912833413, + "step": 35320 + }, + { + "epoch": 5.23, + "learning_rate": 7.413946587537093e-06, + "loss": 1.0839, + "step": 35360 + }, + { + "epoch": 5.23, + "eval_loss": 0.977716863155365, + "eval_runtime": 518.9955, + "eval_samples_per_second": 14.719, + "eval_wer": 0.3491237599702679, + "step": 35360 + }, + { + "epoch": 5.23, + "learning_rate": 7.410979228486648e-06, + "loss": 1.1489, + "step": 35400 + }, + { + "epoch": 5.23, + "eval_loss": 0.9676298499107361, + "eval_runtime": 519.66, + "eval_samples_per_second": 14.7, + "eval_wer": 0.3491809371337088, + "step": 35400 + }, + { + "epoch": 5.24, + "learning_rate": 7.408011869436202e-06, + "loss": 1.0194, + "step": 35440 + }, + { + "epoch": 5.24, + "eval_loss": 1.0061874389648438, + "eval_runtime": 517.9794, + "eval_samples_per_second": 14.748, + "eval_wer": 0.3507818977100546, + "step": 35440 + }, + { + "epoch": 5.24, + "learning_rate": 7.405044510385757e-06, + "loss": 0.9936, + "step": 35480 + }, + { + "epoch": 5.24, + "eval_loss": 0.9882224202156067, + "eval_runtime": 522.0087, + "eval_samples_per_second": 14.634, + "eval_wer": 0.34940964578747247, + "step": 35480 + }, + { + "epoch": 5.25, + "learning_rate": 7.402077151335312e-06, + "loss": 1.1233, + "step": 35520 + }, + { + "epoch": 5.25, + "eval_loss": 0.9520732760429382, + "eval_runtime": 518.8311, + "eval_samples_per_second": 14.723, + "eval_wer": 0.3473226793218788, + "step": 35520 + }, + { + "epoch": 5.26, + "learning_rate": 7.399109792284867e-06, + "loss": 1.0233, + "step": 35560 + }, + { + "epoch": 5.26, + "eval_loss": 1.0154160261154175, + "eval_runtime": 519.0201, + "eval_samples_per_second": 14.718, + "eval_wer": 0.35095342920037736, + "step": 35560 + }, + { + "epoch": 5.26, + "learning_rate": 7.396142433234423e-06, + "loss": 1.0205, + "step": 35600 + }, + { + "epoch": 5.26, + "eval_loss": 0.9261102080345154, + "eval_runtime": 519.1592, + "eval_samples_per_second": 14.714, + "eval_wer": 0.3455215986734898, + "step": 35600 + }, + { + "epoch": 5.27, + "learning_rate": 7.393175074183977e-06, + "loss": 1.0896, + "step": 35640 + }, + { + "epoch": 5.27, + "eval_loss": 1.0003314018249512, + "eval_runtime": 524.6736, + "eval_samples_per_second": 14.56, + "eval_wer": 0.3500671831670431, + "step": 35640 + }, + { + "epoch": 5.27, + "learning_rate": 7.3902077151335315e-06, + "loss": 1.1448, + "step": 35680 + }, + { + "epoch": 5.27, + "eval_loss": 0.9583069682121277, + "eval_runtime": 530.3884, + "eval_samples_per_second": 14.403, + "eval_wer": 0.3467794962691901, + "step": 35680 + }, + { + "epoch": 5.28, + "learning_rate": 7.387240356083086e-06, + "loss": 1.1322, + "step": 35720 + }, + { + "epoch": 5.28, + "eval_loss": 0.9848551750183105, + "eval_runtime": 522.9458, + "eval_samples_per_second": 14.608, + "eval_wer": 0.34889505131650417, + "step": 35720 + }, + { + "epoch": 5.29, + "learning_rate": 7.384272997032641e-06, + "loss": 1.1239, + "step": 35760 + }, + { + "epoch": 5.29, + "eval_loss": 1.0303740501403809, + "eval_runtime": 522.13, + "eval_samples_per_second": 14.63, + "eval_wer": 0.35198261814231396, + "step": 35760 + }, + { + "epoch": 5.29, + "learning_rate": 7.3813056379821965e-06, + "loss": 1.0135, + "step": 35800 + }, + { + "epoch": 5.29, + "eval_loss": 0.9914101362228394, + "eval_runtime": 636.7612, + "eval_samples_per_second": 11.997, + "eval_wer": 0.34872351982618144, + "step": 35800 + }, + { + "epoch": 5.3, + "learning_rate": 7.378338278931752e-06, + "loss": 1.0298, + "step": 35840 + }, + { + "epoch": 5.3, + "eval_loss": 0.9857242107391357, + "eval_runtime": 518.0932, + "eval_samples_per_second": 14.744, + "eval_wer": 0.34775150804768573, + "step": 35840 + }, + { + "epoch": 5.3, + "learning_rate": 7.375370919881306e-06, + "loss": 0.9808, + "step": 35880 + }, + { + "epoch": 5.3, + "eval_loss": 1.0449692010879517, + "eval_runtime": 516.9669, + "eval_samples_per_second": 14.777, + "eval_wer": 0.35075330912833413, + "step": 35880 + }, + { + "epoch": 5.31, + "learning_rate": 7.372403560830861e-06, + "loss": 0.9924, + "step": 35920 + }, + { + "epoch": 5.31, + "eval_loss": 1.0501301288604736, + "eval_runtime": 522.7881, + "eval_samples_per_second": 14.612, + "eval_wer": 0.3517253209068298, + "step": 35920 + }, + { + "epoch": 5.32, + "learning_rate": 7.369436201780415e-06, + "loss": 1.1162, + "step": 35960 + }, + { + "epoch": 5.32, + "eval_loss": 1.015513300895691, + "eval_runtime": 518.2215, + "eval_samples_per_second": 14.741, + "eval_wer": 0.3493238800423111, + "step": 35960 + }, + { + "epoch": 5.32, + "learning_rate": 7.366468842729971e-06, + "loss": 1.187, + "step": 36000 + }, + { + "epoch": 5.32, + "eval_loss": 0.9844435453414917, + "eval_runtime": 517.7293, + "eval_samples_per_second": 14.755, + "eval_wer": 0.3484376340089768, + "step": 36000 + }, + { + "epoch": 5.33, + "learning_rate": 7.363501483679526e-06, + "loss": 1.0584, + "step": 36040 + }, + { + "epoch": 5.33, + "eval_loss": 0.9944560527801514, + "eval_runtime": 518.3905, + "eval_samples_per_second": 14.736, + "eval_wer": 0.3488378741530633, + "step": 36040 + }, + { + "epoch": 5.33, + "learning_rate": 7.360534124629081e-06, + "loss": 0.9844, + "step": 36080 + }, + { + "epoch": 5.33, + "eval_loss": 1.0248990058898926, + "eval_runtime": 517.7808, + "eval_samples_per_second": 14.753, + "eval_wer": 0.3498956516767203, + "step": 36080 + }, + { + "epoch": 5.34, + "learning_rate": 7.3575667655786354e-06, + "loss": 1.063, + "step": 36120 + }, + { + "epoch": 5.34, + "eval_loss": 0.9436596632003784, + "eval_runtime": 517.9756, + "eval_samples_per_second": 14.748, + "eval_wer": 0.3455215986734898, + "step": 36120 + }, + { + "epoch": 5.35, + "learning_rate": 7.35459940652819e-06, + "loss": 1.0438, + "step": 36160 + }, + { + "epoch": 5.35, + "eval_loss": 1.0605299472808838, + "eval_runtime": 517.4259, + "eval_samples_per_second": 14.763, + "eval_wer": 0.3526973326853255, + "step": 36160 + }, + { + "epoch": 5.35, + "learning_rate": 7.351632047477746e-06, + "loss": 1.0743, + "step": 36200 + }, + { + "epoch": 5.35, + "eval_loss": 0.984839141368866, + "eval_runtime": 518.6786, + "eval_samples_per_second": 14.728, + "eval_wer": 0.34752279939392205, + "step": 36200 + }, + { + "epoch": 5.36, + "learning_rate": 7.3486646884273004e-06, + "loss": 1.0614, + "step": 36240 + }, + { + "epoch": 5.36, + "eval_loss": 1.00856351852417, + "eval_runtime": 517.1187, + "eval_samples_per_second": 14.772, + "eval_wer": 0.34829469110037453, + "step": 36240 + }, + { + "epoch": 5.36, + "learning_rate": 7.345697329376855e-06, + "loss": 1.033, + "step": 36280 + }, + { + "epoch": 5.36, + "eval_loss": 1.031351089477539, + "eval_runtime": 518.7888, + "eval_samples_per_second": 14.725, + "eval_wer": 0.35023871465736583, + "step": 36280 + }, + { + "epoch": 5.37, + "learning_rate": 7.34272997032641e-06, + "loss": 1.0489, + "step": 36320 + }, + { + "epoch": 5.37, + "eval_loss": 0.9767986536026001, + "eval_runtime": 518.2972, + "eval_samples_per_second": 14.739, + "eval_wer": 0.34695102775951286, + "step": 36320 + }, + { + "epoch": 5.37, + "learning_rate": 7.339762611275965e-06, + "loss": 1.1508, + "step": 36360 + }, + { + "epoch": 5.37, + "eval_loss": 0.9689246416091919, + "eval_runtime": 519.5598, + "eval_samples_per_second": 14.703, + "eval_wer": 0.3466365533605878, + "step": 36360 + }, + { + "epoch": 5.38, + "learning_rate": 7.336795252225521e-06, + "loss": 1.0752, + "step": 36400 + }, + { + "epoch": 5.38, + "eval_loss": 0.9996673464775085, + "eval_runtime": 518.569, + "eval_samples_per_second": 14.731, + "eval_wer": 0.3479230395380085, + "step": 36400 + }, + { + "epoch": 5.39, + "learning_rate": 7.333827893175075e-06, + "loss": 1.0955, + "step": 36440 + }, + { + "epoch": 5.39, + "eval_loss": 0.9890244007110596, + "eval_runtime": 518.2003, + "eval_samples_per_second": 14.741, + "eval_wer": 0.3468080848509105, + "step": 36440 + }, + { + "epoch": 5.39, + "learning_rate": 7.33086053412463e-06, + "loss": 1.1708, + "step": 36480 + }, + { + "epoch": 5.39, + "eval_loss": 0.9723288416862488, + "eval_runtime": 517.3425, + "eval_samples_per_second": 14.766, + "eval_wer": 0.34666514194230824, + "step": 36480 + }, + { + "epoch": 5.4, + "learning_rate": 7.327893175074184e-06, + "loss": 1.0326, + "step": 36520 + }, + { + "epoch": 5.4, + "eval_loss": 0.98514324426651, + "eval_runtime": 523.5992, + "eval_samples_per_second": 14.589, + "eval_wer": 0.34692243917779236, + "step": 36520 + }, + { + "epoch": 5.4, + "learning_rate": 7.324925816023739e-06, + "loss": 1.1057, + "step": 36560 + }, + { + "epoch": 5.4, + "eval_loss": 0.9577740430831909, + "eval_runtime": 517.0791, + "eval_samples_per_second": 14.773, + "eval_wer": 0.3455215986734898, + "step": 36560 + }, + { + "epoch": 5.41, + "learning_rate": 7.321958456973295e-06, + "loss": 1.0094, + "step": 36600 + }, + { + "epoch": 5.41, + "eval_loss": 1.0130566358566284, + "eval_runtime": 517.523, + "eval_samples_per_second": 14.761, + "eval_wer": 0.3481803367734927, + "step": 36600 + }, + { + "epoch": 5.42, + "learning_rate": 7.31899109792285e-06, + "loss": 1.0692, + "step": 36640 + }, + { + "epoch": 5.42, + "eval_loss": 0.9417288899421692, + "eval_runtime": 517.4106, + "eval_samples_per_second": 14.764, + "eval_wer": 0.3452357128562852, + "step": 36640 + }, + { + "epoch": 5.42, + "learning_rate": 7.316023738872404e-06, + "loss": 1.0994, + "step": 36680 + }, + { + "epoch": 5.42, + "eval_loss": 0.9934326410293579, + "eval_runtime": 517.4953, + "eval_samples_per_second": 14.761, + "eval_wer": 0.34737985648531977, + "step": 36680 + }, + { + "epoch": 5.43, + "learning_rate": 7.313056379821959e-06, + "loss": 1.0447, + "step": 36720 + }, + { + "epoch": 5.43, + "eval_loss": 0.9766961932182312, + "eval_runtime": 518.6527, + "eval_samples_per_second": 14.729, + "eval_wer": 0.3461791360530604, + "step": 36720 + }, + { + "epoch": 5.43, + "learning_rate": 7.310089020771513e-06, + "loss": 1.0525, + "step": 36760 + }, + { + "epoch": 5.43, + "eval_loss": 0.9443075060844421, + "eval_runtime": 516.1217, + "eval_samples_per_second": 14.801, + "eval_wer": 0.3450927699476829, + "step": 36760 + }, + { + "epoch": 5.44, + "learning_rate": 7.3071216617210686e-06, + "loss": 1.0807, + "step": 36800 + }, + { + "epoch": 5.44, + "eval_loss": 1.0100418329238892, + "eval_runtime": 516.7653, + "eval_samples_per_second": 14.782, + "eval_wer": 0.34803739386489035, + "step": 36800 + }, + { + "epoch": 5.45, + "learning_rate": 7.304154302670624e-06, + "loss": 1.11, + "step": 36840 + }, + { + "epoch": 5.45, + "eval_loss": 1.0191208124160767, + "eval_runtime": 518.2851, + "eval_samples_per_second": 14.739, + "eval_wer": 0.3510677835272592, + "step": 36840 + }, + { + "epoch": 5.45, + "learning_rate": 7.301186943620179e-06, + "loss": 1.0485, + "step": 36880 + }, + { + "epoch": 5.45, + "eval_loss": 0.9987328052520752, + "eval_runtime": 519.6238, + "eval_samples_per_second": 14.701, + "eval_wer": 0.34892363989822467, + "step": 36880 + }, + { + "epoch": 5.46, + "learning_rate": 7.298219584569734e-06, + "loss": 1.105, + "step": 36920 + }, + { + "epoch": 5.46, + "eval_loss": 0.9528825879096985, + "eval_runtime": 517.7327, + "eval_samples_per_second": 14.755, + "eval_wer": 0.34503559278424195, + "step": 36920 + }, + { + "epoch": 5.46, + "learning_rate": 7.295252225519288e-06, + "loss": 1.0527, + "step": 36960 + }, + { + "epoch": 5.46, + "eval_loss": 0.9805234670639038, + "eval_runtime": 519.2908, + "eval_samples_per_second": 14.71, + "eval_wer": 0.34695102775951286, + "step": 36960 + }, + { + "epoch": 5.47, + "learning_rate": 7.2922848664688425e-06, + "loss": 1.1002, + "step": 37000 + }, + { + "epoch": 5.47, + "eval_loss": 0.9213802218437195, + "eval_runtime": 517.5742, + "eval_samples_per_second": 14.759, + "eval_wer": 0.3428914491552074, + "step": 37000 + }, + { + "epoch": 5.48, + "learning_rate": 7.289317507418399e-06, + "loss": 1.0848, + "step": 37040 + }, + { + "epoch": 5.48, + "eval_loss": 0.9836987257003784, + "eval_runtime": 517.8899, + "eval_samples_per_second": 14.75, + "eval_wer": 0.34880928557134283, + "step": 37040 + }, + { + "epoch": 5.48, + "learning_rate": 7.286350148367953e-06, + "loss": 1.1237, + "step": 37080 + }, + { + "epoch": 5.48, + "eval_loss": 0.9189736843109131, + "eval_runtime": 517.163, + "eval_samples_per_second": 14.771, + "eval_wer": 0.3433202778810143, + "step": 37080 + }, + { + "epoch": 5.49, + "learning_rate": 7.283382789317508e-06, + "loss": 1.0362, + "step": 37120 + }, + { + "epoch": 5.49, + "eval_loss": 0.9509996771812439, + "eval_runtime": 518.7047, + "eval_samples_per_second": 14.727, + "eval_wer": 0.3453214786014466, + "step": 37120 + }, + { + "epoch": 5.49, + "learning_rate": 7.280415430267063e-06, + "loss": 1.0578, + "step": 37160 + }, + { + "epoch": 5.49, + "eval_loss": 0.9367378354072571, + "eval_runtime": 518.0235, + "eval_samples_per_second": 14.746, + "eval_wer": 0.3444352325681123, + "step": 37160 + }, + { + "epoch": 5.5, + "learning_rate": 7.277448071216617e-06, + "loss": 1.0191, + "step": 37200 + }, + { + "epoch": 5.5, + "eval_loss": 1.0272654294967651, + "eval_runtime": 519.302, + "eval_samples_per_second": 14.71, + "eval_wer": 0.35138225792618427, + "step": 37200 + }, + { + "epoch": 5.5, + "learning_rate": 7.274480712166173e-06, + "loss": 1.0812, + "step": 37240 + }, + { + "epoch": 5.5, + "eval_loss": 0.9841765761375427, + "eval_runtime": 516.997, + "eval_samples_per_second": 14.776, + "eval_wer": 0.34737985648531977, + "step": 37240 + }, + { + "epoch": 5.51, + "learning_rate": 7.271513353115728e-06, + "loss": 1.0821, + "step": 37280 + }, + { + "epoch": 5.51, + "eval_loss": 0.9411097764968872, + "eval_runtime": 516.8692, + "eval_samples_per_second": 14.779, + "eval_wer": 0.3449498270390806, + "step": 37280 + }, + { + "epoch": 5.52, + "learning_rate": 7.268545994065282e-06, + "loss": 1.1125, + "step": 37320 + }, + { + "epoch": 5.52, + "eval_loss": 0.9436768889427185, + "eval_runtime": 516.5002, + "eval_samples_per_second": 14.79, + "eval_wer": 0.3450927699476829, + "step": 37320 + }, + { + "epoch": 5.52, + "learning_rate": 7.2655786350148375e-06, + "loss": 1.02, + "step": 37360 + }, + { + "epoch": 5.52, + "eval_loss": 0.9287549257278442, + "eval_runtime": 519.025, + "eval_samples_per_second": 14.718, + "eval_wer": 0.3436347522799394, + "step": 37360 + }, + { + "epoch": 5.53, + "learning_rate": 7.262611275964392e-06, + "loss": 1.0961, + "step": 37400 + }, + { + "epoch": 5.53, + "eval_loss": 0.9613959193229675, + "eval_runtime": 516.7946, + "eval_samples_per_second": 14.782, + "eval_wer": 0.34606478172617855, + "step": 37400 + }, + { + "epoch": 5.53, + "learning_rate": 7.259643916913947e-06, + "loss": 1.0848, + "step": 37440 + }, + { + "epoch": 5.53, + "eval_loss": 0.9598263502120972, + "eval_runtime": 517.5735, + "eval_samples_per_second": 14.759, + "eval_wer": 0.3456645415820921, + "step": 37440 + }, + { + "epoch": 5.54, + "learning_rate": 7.2566765578635025e-06, + "loss": 1.103, + "step": 37480 + }, + { + "epoch": 5.54, + "eval_loss": 0.9258189797401428, + "eval_runtime": 517.1644, + "eval_samples_per_second": 14.771, + "eval_wer": 0.34309156922725065, + "step": 37480 + }, + { + "epoch": 5.55, + "learning_rate": 7.253709198813057e-06, + "loss": 1.0648, + "step": 37520 + }, + { + "epoch": 5.55, + "eval_loss": 0.9476194977760315, + "eval_runtime": 517.3108, + "eval_samples_per_second": 14.767, + "eval_wer": 0.34512135852940334, + "step": 37520 + }, + { + "epoch": 5.55, + "learning_rate": 7.2507418397626114e-06, + "loss": 1.0217, + "step": 37560 + }, + { + "epoch": 5.55, + "eval_loss": 0.9669373631477356, + "eval_runtime": 516.2075, + "eval_samples_per_second": 14.798, + "eval_wer": 0.3465507876154264, + "step": 37560 + }, + { + "epoch": 5.56, + "learning_rate": 7.247774480712167e-06, + "loss": 1.1069, + "step": 37600 + }, + { + "epoch": 5.56, + "eval_loss": 0.9176297187805176, + "eval_runtime": 518.363, + "eval_samples_per_second": 14.737, + "eval_wer": 0.3434060436261757, + "step": 37600 + }, + { + "epoch": 5.56, + "learning_rate": 7.244807121661722e-06, + "loss": 1.0155, + "step": 37640 + }, + { + "epoch": 5.56, + "eval_loss": 0.9762797951698303, + "eval_runtime": 516.6601, + "eval_samples_per_second": 14.785, + "eval_wer": 0.3463792561251036, + "step": 37640 + }, + { + "epoch": 5.57, + "learning_rate": 7.2418397626112765e-06, + "loss": 1.0548, + "step": 37680 + }, + { + "epoch": 5.57, + "eval_loss": 0.9596333503723145, + "eval_runtime": 517.415, + "eval_samples_per_second": 14.764, + "eval_wer": 0.3453214786014466, + "step": 37680 + }, + { + "epoch": 5.58, + "learning_rate": 7.238872403560832e-06, + "loss": 0.997, + "step": 37720 + }, + { + "epoch": 5.58, + "eval_loss": 0.9662673473358154, + "eval_runtime": 519.48, + "eval_samples_per_second": 14.705, + "eval_wer": 0.3449498270390806, + "step": 37720 + }, + { + "epoch": 5.58, + "learning_rate": 7.235905044510386e-06, + "loss": 0.9654, + "step": 37760 + }, + { + "epoch": 5.58, + "eval_loss": 1.0204555988311768, + "eval_runtime": 518.7412, + "eval_samples_per_second": 14.726, + "eval_wer": 0.3490379942251065, + "step": 37760 + }, + { + "epoch": 5.59, + "learning_rate": 7.232937685459941e-06, + "loss": 0.9863, + "step": 37800 + }, + { + "epoch": 5.59, + "eval_loss": 1.0025908946990967, + "eval_runtime": 518.389, + "eval_samples_per_second": 14.736, + "eval_wer": 0.3480945710283313, + "step": 37800 + }, + { + "epoch": 5.59, + "learning_rate": 7.229970326409496e-06, + "loss": 1.017, + "step": 37840 + }, + { + "epoch": 5.59, + "eval_loss": 0.9650992751121521, + "eval_runtime": 519.2911, + "eval_samples_per_second": 14.71, + "eval_wer": 0.34412075816918725, + "step": 37840 + }, + { + "epoch": 5.6, + "learning_rate": 7.227002967359051e-06, + "loss": 1.0817, + "step": 37880 + }, + { + "epoch": 5.6, + "eval_loss": 0.9527426362037659, + "eval_runtime": 517.9839, + "eval_samples_per_second": 14.748, + "eval_wer": 0.3429772149003688, + "step": 37880 + }, + { + "epoch": 5.61, + "learning_rate": 7.224035608308606e-06, + "loss": 1.095, + "step": 37920 + }, + { + "epoch": 5.61, + "eval_loss": 0.9103830456733704, + "eval_runtime": 518.0981, + "eval_samples_per_second": 14.744, + "eval_wer": 0.34089024843477517, + "step": 37920 + }, + { + "epoch": 5.61, + "learning_rate": 7.221068249258161e-06, + "loss": 1.064, + "step": 37960 + }, + { + "epoch": 5.61, + "eval_loss": 0.952324628829956, + "eval_runtime": 519.75, + "eval_samples_per_second": 14.697, + "eval_wer": 0.34366334086165984, + "step": 37960 + }, + { + "epoch": 5.62, + "learning_rate": 7.218100890207715e-06, + "loss": 0.9916, + "step": 38000 + }, + { + "epoch": 5.62, + "eval_loss": 0.9753944277763367, + "eval_runtime": 518.9416, + "eval_samples_per_second": 14.72, + "eval_wer": 0.34503559278424195, + "step": 38000 + }, + { + "epoch": 5.62, + "learning_rate": 7.21513353115727e-06, + "loss": 1.0613, + "step": 38040 + }, + { + "epoch": 5.62, + "eval_loss": 0.9474734663963318, + "eval_runtime": 518.4558, + "eval_samples_per_second": 14.734, + "eval_wer": 0.34334886646273477, + "step": 38040 + }, + { + "epoch": 5.63, + "learning_rate": 7.212166172106826e-06, + "loss": 1.0493, + "step": 38080 + }, + { + "epoch": 5.63, + "eval_loss": 0.9691063165664673, + "eval_runtime": 518.9537, + "eval_samples_per_second": 14.72, + "eval_wer": 0.3443208782412305, + "step": 38080 + }, + { + "epoch": 5.63, + "learning_rate": 7.20919881305638e-06, + "loss": 1.069, + "step": 38120 + }, + { + "epoch": 5.63, + "eval_loss": 0.9744353890419006, + "eval_runtime": 517.2876, + "eval_samples_per_second": 14.767, + "eval_wer": 0.34512135852940334, + "step": 38120 + }, + { + "epoch": 5.64, + "learning_rate": 7.206231454005936e-06, + "loss": 0.9912, + "step": 38160 + }, + { + "epoch": 5.64, + "eval_loss": 1.00869882106781, + "eval_runtime": 518.0533, + "eval_samples_per_second": 14.746, + "eval_wer": 0.34775150804768573, + "step": 38160 + }, + { + "epoch": 5.65, + "learning_rate": 7.20326409495549e-06, + "loss": 1.1896, + "step": 38200 + }, + { + "epoch": 5.65, + "eval_loss": 0.945558488368988, + "eval_runtime": 521.2602, + "eval_samples_per_second": 14.655, + "eval_wer": 0.34257697475628235, + "step": 38200 + }, + { + "epoch": 5.65, + "learning_rate": 7.2002967359050446e-06, + "loss": 1.0302, + "step": 38240 + }, + { + "epoch": 5.65, + "eval_loss": 0.9520701766014099, + "eval_runtime": 519.2605, + "eval_samples_per_second": 14.711, + "eval_wer": 0.3434632207896166, + "step": 38240 + }, + { + "epoch": 5.66, + "learning_rate": 7.197329376854601e-06, + "loss": 1.0106, + "step": 38280 + }, + { + "epoch": 5.66, + "eval_loss": 1.0306862592697144, + "eval_runtime": 522.5575, + "eval_samples_per_second": 14.618, + "eval_wer": 0.3498384745132794, + "step": 38280 + }, + { + "epoch": 5.66, + "learning_rate": 7.194362017804155e-06, + "loss": 1.0132, + "step": 38320 + }, + { + "epoch": 5.66, + "eval_loss": 0.9693185091018677, + "eval_runtime": 517.7995, + "eval_samples_per_second": 14.753, + "eval_wer": 0.3456073644186512, + "step": 38320 + }, + { + "epoch": 5.67, + "learning_rate": 7.19139465875371e-06, + "loss": 1.1024, + "step": 38360 + }, + { + "epoch": 5.67, + "eval_loss": 0.9740729331970215, + "eval_runtime": 519.5555, + "eval_samples_per_second": 14.703, + "eval_wer": 0.34452099831327365, + "step": 38360 + }, + { + "epoch": 5.68, + "learning_rate": 7.188427299703265e-06, + "loss": 1.0674, + "step": 38400 + }, + { + "epoch": 5.68, + "eval_loss": 0.9593319892883301, + "eval_runtime": 519.1492, + "eval_samples_per_second": 14.714, + "eval_wer": 0.3449212384573601, + "step": 38400 + }, + { + "epoch": 5.68, + "learning_rate": 7.185459940652819e-06, + "loss": 1.076, + "step": 38440 + }, + { + "epoch": 5.68, + "eval_loss": 0.975508451461792, + "eval_runtime": 519.4455, + "eval_samples_per_second": 14.706, + "eval_wer": 0.34512135852940334, + "step": 38440 + }, + { + "epoch": 5.69, + "learning_rate": 7.182492581602375e-06, + "loss": 1.0063, + "step": 38480 + }, + { + "epoch": 5.69, + "eval_loss": 0.98208087682724, + "eval_runtime": 518.2571, + "eval_samples_per_second": 14.74, + "eval_wer": 0.3452643014380057, + "step": 38480 + }, + { + "epoch": 5.69, + "learning_rate": 7.17952522255193e-06, + "loss": 1.0995, + "step": 38520 + }, + { + "epoch": 5.69, + "eval_loss": 1.0282764434814453, + "eval_runtime": 519.4153, + "eval_samples_per_second": 14.707, + "eval_wer": 0.3498956516767203, + "step": 38520 + }, + { + "epoch": 5.7, + "learning_rate": 7.176557863501484e-06, + "loss": 1.0265, + "step": 38560 + }, + { + "epoch": 5.7, + "eval_loss": 1.0229235887527466, + "eval_runtime": 518.2115, + "eval_samples_per_second": 14.741, + "eval_wer": 0.3502958918208068, + "step": 38560 + }, + { + "epoch": 5.71, + "learning_rate": 7.173590504451039e-06, + "loss": 1.2228, + "step": 38600 + }, + { + "epoch": 5.71, + "eval_loss": 0.9659146070480347, + "eval_runtime": 517.9214, + "eval_samples_per_second": 14.749, + "eval_wer": 0.3456645415820921, + "step": 38600 + }, + { + "epoch": 5.71, + "learning_rate": 7.170623145400594e-06, + "loss": 1.093, + "step": 38640 + }, + { + "epoch": 5.71, + "eval_loss": 0.9389090538024902, + "eval_runtime": 519.044, + "eval_samples_per_second": 14.717, + "eval_wer": 0.34317733497241204, + "step": 38640 + }, + { + "epoch": 5.72, + "learning_rate": 7.167655786350149e-06, + "loss": 1.0796, + "step": 38680 + }, + { + "epoch": 5.72, + "eval_loss": 0.9630261063575745, + "eval_runtime": 517.78, + "eval_samples_per_second": 14.753, + "eval_wer": 0.3451785356928443, + "step": 38680 + }, + { + "epoch": 5.72, + "learning_rate": 7.164688427299704e-06, + "loss": 1.122, + "step": 38720 + }, + { + "epoch": 5.72, + "eval_loss": 0.9763597846031189, + "eval_runtime": 518.1935, + "eval_samples_per_second": 14.742, + "eval_wer": 0.3462649017982218, + "step": 38720 + }, + { + "epoch": 5.73, + "learning_rate": 7.161721068249259e-06, + "loss": 1.0532, + "step": 38760 + }, + { + "epoch": 5.73, + "eval_loss": 0.9626193046569824, + "eval_runtime": 518.6468, + "eval_samples_per_second": 14.729, + "eval_wer": 0.3449212384573601, + "step": 38760 + }, + { + "epoch": 5.74, + "learning_rate": 7.1587537091988135e-06, + "loss": 1.1039, + "step": 38800 + }, + { + "epoch": 5.74, + "eval_loss": 0.8972166180610657, + "eval_runtime": 519.4824, + "eval_samples_per_second": 14.705, + "eval_wer": 0.3413190771605821, + "step": 38800 + }, + { + "epoch": 5.74, + "learning_rate": 7.155786350148368e-06, + "loss": 1.1073, + "step": 38840 + }, + { + "epoch": 5.74, + "eval_loss": 0.9370134472846985, + "eval_runtime": 518.3432, + "eval_samples_per_second": 14.737, + "eval_wer": 0.3436347522799394, + "step": 38840 + }, + { + "epoch": 5.75, + "learning_rate": 7.152818991097923e-06, + "loss": 1.0676, + "step": 38880 + }, + { + "epoch": 5.75, + "eval_loss": 0.909221351146698, + "eval_runtime": 523.3946, + "eval_samples_per_second": 14.595, + "eval_wer": 0.34189084879499126, + "step": 38880 + }, + { + "epoch": 5.75, + "learning_rate": 7.1498516320474786e-06, + "loss": 1.0693, + "step": 38920 + }, + { + "epoch": 5.75, + "eval_loss": 0.9393254518508911, + "eval_runtime": 520.3931, + "eval_samples_per_second": 14.679, + "eval_wer": 0.3433202778810143, + "step": 38920 + }, + { + "epoch": 5.76, + "learning_rate": 7.146884272997033e-06, + "loss": 1.0178, + "step": 38960 + }, + { + "epoch": 5.76, + "eval_loss": 0.922400712966919, + "eval_runtime": 518.8719, + "eval_samples_per_second": 14.722, + "eval_wer": 0.34263415191972324, + "step": 38960 + }, + { + "epoch": 5.76, + "learning_rate": 7.143916913946588e-06, + "loss": 1.0304, + "step": 39000 + }, + { + "epoch": 5.76, + "eval_loss": 0.9404299259185791, + "eval_runtime": 518.0482, + "eval_samples_per_second": 14.746, + "eval_wer": 0.3439778152605849, + "step": 39000 + }, + { + "epoch": 5.77, + "learning_rate": 7.140949554896143e-06, + "loss": 1.1565, + "step": 39040 + }, + { + "epoch": 5.77, + "eval_loss": 0.9346172213554382, + "eval_runtime": 519.4189, + "eval_samples_per_second": 14.707, + "eval_wer": 0.3437205180251008, + "step": 39040 + }, + { + "epoch": 5.78, + "learning_rate": 7.137982195845697e-06, + "loss": 1.003, + "step": 39080 + }, + { + "epoch": 5.78, + "eval_loss": 0.9471651315689087, + "eval_runtime": 518.0277, + "eval_samples_per_second": 14.746, + "eval_wer": 0.34374910660682123, + "step": 39080 + }, + { + "epoch": 5.78, + "learning_rate": 7.135014836795253e-06, + "loss": 1.1173, + "step": 39120 + }, + { + "epoch": 5.78, + "eval_loss": 0.9173640608787537, + "eval_runtime": 522.0102, + "eval_samples_per_second": 14.634, + "eval_wer": 0.34243403184768, + "step": 39120 + }, + { + "epoch": 5.79, + "learning_rate": 7.132047477744808e-06, + "loss": 1.1126, + "step": 39160 + }, + { + "epoch": 5.79, + "eval_loss": 0.9742285013198853, + "eval_runtime": 520.3717, + "eval_samples_per_second": 14.68, + "eval_wer": 0.34829469110037453, + "step": 39160 + }, + { + "epoch": 5.79, + "learning_rate": 7.129080118694362e-06, + "loss": 1.0695, + "step": 39200 + }, + { + "epoch": 5.79, + "eval_loss": 0.9456039071083069, + "eval_runtime": 518.2893, + "eval_samples_per_second": 14.739, + "eval_wer": 0.3448354727121987, + "step": 39200 + }, + { + "epoch": 5.8, + "learning_rate": 7.1261127596439175e-06, + "loss": 1.0757, + "step": 39240 + }, + { + "epoch": 5.8, + "eval_loss": 0.9586562514305115, + "eval_runtime": 518.8031, + "eval_samples_per_second": 14.724, + "eval_wer": 0.3466365533605878, + "step": 39240 + }, + { + "epoch": 5.81, + "learning_rate": 7.123145400593472e-06, + "loss": 1.0876, + "step": 39280 + }, + { + "epoch": 5.81, + "eval_loss": 0.9583691954612732, + "eval_runtime": 519.0526, + "eval_samples_per_second": 14.717, + "eval_wer": 0.34666514194230824, + "step": 39280 + }, + { + "epoch": 5.81, + "learning_rate": 7.120178041543028e-06, + "loss": 1.0168, + "step": 39320 + }, + { + "epoch": 5.81, + "eval_loss": 0.9809749126434326, + "eval_runtime": 520.1078, + "eval_samples_per_second": 14.687, + "eval_wer": 0.347579976557363, + "step": 39320 + }, + { + "epoch": 5.82, + "learning_rate": 7.1172106824925825e-06, + "loss": 1.0805, + "step": 39360 + }, + { + "epoch": 5.82, + "eval_loss": 0.9543889164924622, + "eval_runtime": 523.162, + "eval_samples_per_second": 14.602, + "eval_wer": 0.3453786557648875, + "step": 39360 + }, + { + "epoch": 5.82, + "learning_rate": 7.114243323442137e-06, + "loss": 1.0683, + "step": 39400 + }, + { + "epoch": 5.82, + "eval_loss": 0.9149014949798584, + "eval_runtime": 518.2411, + "eval_samples_per_second": 14.74, + "eval_wer": 0.3426913290831642, + "step": 39400 + }, + { + "epoch": 5.83, + "learning_rate": 7.111275964391691e-06, + "loss": 1.1555, + "step": 39440 + }, + { + "epoch": 5.83, + "eval_loss": 0.9243788123130798, + "eval_runtime": 519.8411, + "eval_samples_per_second": 14.695, + "eval_wer": 0.34317733497241204, + "step": 39440 + }, + { + "epoch": 5.84, + "learning_rate": 7.108308605341247e-06, + "loss": 1.0304, + "step": 39480 + }, + { + "epoch": 5.84, + "eval_loss": 0.9692785739898682, + "eval_runtime": 520.3029, + "eval_samples_per_second": 14.682, + "eval_wer": 0.3456931301638126, + "step": 39480 + }, + { + "epoch": 5.84, + "learning_rate": 7.105341246290802e-06, + "loss": 0.9937, + "step": 39520 + }, + { + "epoch": 5.84, + "eval_loss": 1.015712857246399, + "eval_runtime": 519.5605, + "eval_samples_per_second": 14.703, + "eval_wer": 0.34880928557134283, + "step": 39520 + }, + { + "epoch": 5.85, + "learning_rate": 7.102373887240357e-06, + "loss": 1.036, + "step": 39560 + }, + { + "epoch": 5.85, + "eval_loss": 0.9958353042602539, + "eval_runtime": 520.6191, + "eval_samples_per_second": 14.673, + "eval_wer": 0.34692243917779236, + "step": 39560 + }, + { + "epoch": 5.85, + "learning_rate": 7.099406528189912e-06, + "loss": 1.0741, + "step": 39600 + }, + { + "epoch": 5.85, + "eval_loss": 0.966940701007843, + "eval_runtime": 518.7404, + "eval_samples_per_second": 14.726, + "eval_wer": 0.3450070042025215, + "step": 39600 + }, + { + "epoch": 5.86, + "learning_rate": 7.096439169139466e-06, + "loss": 1.0465, + "step": 39640 + }, + { + "epoch": 5.86, + "eval_loss": 0.9787890911102295, + "eval_runtime": 518.7937, + "eval_samples_per_second": 14.725, + "eval_wer": 0.3459504273992967, + "step": 39640 + }, + { + "epoch": 5.87, + "learning_rate": 7.0934718100890206e-06, + "loss": 0.9698, + "step": 39680 + }, + { + "epoch": 5.87, + "eval_loss": 1.0056897401809692, + "eval_runtime": 517.555, + "eval_samples_per_second": 14.76, + "eval_wer": 0.3485805769175791, + "step": 39680 + }, + { + "epoch": 5.87, + "learning_rate": 7.090504451038577e-06, + "loss": 1.0317, + "step": 39720 + }, + { + "epoch": 5.87, + "eval_loss": 0.9805713891983032, + "eval_runtime": 522.4286, + "eval_samples_per_second": 14.622, + "eval_wer": 0.34643643328854457, + "step": 39720 + }, + { + "epoch": 5.88, + "learning_rate": 7.087537091988131e-06, + "loss": 1.0913, + "step": 39760 + }, + { + "epoch": 5.88, + "eval_loss": 0.9572883248329163, + "eval_runtime": 517.9846, + "eval_samples_per_second": 14.748, + "eval_wer": 0.3444352325681123, + "step": 39760 + }, + { + "epoch": 5.88, + "learning_rate": 7.0845697329376864e-06, + "loss": 1.0677, + "step": 39800 + }, + { + "epoch": 5.88, + "eval_loss": 0.9352319836616516, + "eval_runtime": 519.7277, + "eval_samples_per_second": 14.698, + "eval_wer": 0.34343463220789616, + "step": 39800 + }, + { + "epoch": 5.89, + "learning_rate": 7.081602373887241e-06, + "loss": 0.9991, + "step": 39840 + }, + { + "epoch": 5.89, + "eval_loss": 1.0179932117462158, + "eval_runtime": 522.9266, + "eval_samples_per_second": 14.608, + "eval_wer": 0.35049601189285, + "step": 39840 + }, + { + "epoch": 5.89, + "learning_rate": 7.078635014836795e-06, + "loss": 1.0404, + "step": 39880 + }, + { + "epoch": 5.89, + "eval_loss": 0.9049265384674072, + "eval_runtime": 520.056, + "eval_samples_per_second": 14.689, + "eval_wer": 0.34169072872294803, + "step": 39880 + }, + { + "epoch": 5.9, + "learning_rate": 7.07566765578635e-06, + "loss": 1.0251, + "step": 39920 + }, + { + "epoch": 5.9, + "eval_loss": 0.9558963775634766, + "eval_runtime": 518.1895, + "eval_samples_per_second": 14.742, + "eval_wer": 0.34477829554875783, + "step": 39920 + }, + { + "epoch": 5.91, + "learning_rate": 7.072700296735906e-06, + "loss": 1.0107, + "step": 39960 + }, + { + "epoch": 5.91, + "eval_loss": 0.9357099533081055, + "eval_runtime": 518.2015, + "eval_samples_per_second": 14.741, + "eval_wer": 0.3440635810057463, + "step": 39960 + }, + { + "epoch": 5.91, + "learning_rate": 7.06973293768546e-06, + "loss": 1.0749, + "step": 40000 + }, + { + "epoch": 5.91, + "eval_loss": 0.9772769212722778, + "eval_runtime": 517.9622, + "eval_samples_per_second": 14.748, + "eval_wer": 0.34700820492295376, + "step": 40000 + }, + { + "epoch": 5.92, + "learning_rate": 7.066765578635016e-06, + "loss": 1.0755, + "step": 40040 + }, + { + "epoch": 5.92, + "eval_loss": 0.9932928681373596, + "eval_runtime": 518.6296, + "eval_samples_per_second": 14.729, + "eval_wer": 0.3481517481917722, + "step": 40040 + }, + { + "epoch": 5.92, + "learning_rate": 7.06379821958457e-06, + "loss": 1.0321, + "step": 40080 + }, + { + "epoch": 5.92, + "eval_loss": 0.9989207983016968, + "eval_runtime": 519.0954, + "eval_samples_per_second": 14.716, + "eval_wer": 0.3480659824466108, + "step": 40080 + }, + { + "epoch": 5.93, + "learning_rate": 7.0608308605341245e-06, + "loss": 1.0955, + "step": 40120 + }, + { + "epoch": 5.93, + "eval_loss": 0.9509425163269043, + "eval_runtime": 518.7975, + "eval_samples_per_second": 14.724, + "eval_wer": 0.34283427199176647, + "step": 40120 + }, + { + "epoch": 5.94, + "learning_rate": 7.057863501483681e-06, + "loss": 1.1126, + "step": 40160 + }, + { + "epoch": 5.94, + "eval_loss": 0.9499536752700806, + "eval_runtime": 518.1865, + "eval_samples_per_second": 14.742, + "eval_wer": 0.3429772149003688, + "step": 40160 + }, + { + "epoch": 5.94, + "learning_rate": 7.054896142433235e-06, + "loss": 1.0296, + "step": 40200 + }, + { + "epoch": 5.94, + "eval_loss": 0.9404110312461853, + "eval_runtime": 522.2708, + "eval_samples_per_second": 14.627, + "eval_wer": 0.34214814603047544, + "step": 40200 + }, + { + "epoch": 5.95, + "learning_rate": 7.0519287833827895e-06, + "loss": 1.0119, + "step": 40240 + }, + { + "epoch": 5.95, + "eval_loss": 0.9105411767959595, + "eval_runtime": 517.3811, + "eval_samples_per_second": 14.765, + "eval_wer": 0.3399754138197204, + "step": 40240 + }, + { + "epoch": 5.95, + "learning_rate": 7.048961424332345e-06, + "loss": 1.0725, + "step": 40280 + }, + { + "epoch": 5.95, + "eval_loss": 0.9018839001655579, + "eval_runtime": 517.5906, + "eval_samples_per_second": 14.759, + "eval_wer": 0.3387461048057406, + "step": 40280 + }, + { + "epoch": 5.96, + "learning_rate": 7.045994065281899e-06, + "loss": 1.0227, + "step": 40320 + }, + { + "epoch": 5.96, + "eval_loss": 1.0091384649276733, + "eval_runtime": 517.5566, + "eval_samples_per_second": 14.76, + "eval_wer": 0.34746562223048116, + "step": 40320 + }, + { + "epoch": 5.97, + "learning_rate": 7.043026706231455e-06, + "loss": 1.1028, + "step": 40360 + }, + { + "epoch": 5.97, + "eval_loss": 0.9156641960144043, + "eval_runtime": 517.9703, + "eval_samples_per_second": 14.748, + "eval_wer": 0.3389462248777838, + "step": 40360 + }, + { + "epoch": 5.97, + "learning_rate": 7.04005934718101e-06, + "loss": 1.1154, + "step": 40400 + }, + { + "epoch": 5.97, + "eval_loss": 0.9069753885269165, + "eval_runtime": 517.4651, + "eval_samples_per_second": 14.762, + "eval_wer": 0.339203522113268, + "step": 40400 + }, + { + "epoch": 5.98, + "learning_rate": 7.037091988130564e-06, + "loss": 1.0093, + "step": 40440 + }, + { + "epoch": 5.98, + "eval_loss": 0.9869636297225952, + "eval_runtime": 518.4958, + "eval_samples_per_second": 14.733, + "eval_wer": 0.34597901598101716, + "step": 40440 + }, + { + "epoch": 5.98, + "learning_rate": 7.034124629080119e-06, + "loss": 1.0916, + "step": 40480 + }, + { + "epoch": 5.98, + "eval_loss": 0.9046074151992798, + "eval_runtime": 518.1892, + "eval_samples_per_second": 14.742, + "eval_wer": 0.339203522113268, + "step": 40480 + }, + { + "epoch": 5.99, + "learning_rate": 7.031157270029674e-06, + "loss": 0.9761, + "step": 40520 + }, + { + "epoch": 5.99, + "eval_loss": 0.9241064786911011, + "eval_runtime": 517.2973, + "eval_samples_per_second": 14.767, + "eval_wer": 0.3402041224734841, + "step": 40520 + }, + { + "epoch": 6.0, + "learning_rate": 7.028189910979229e-06, + "loss": 1.0169, + "step": 40560 + }, + { + "epoch": 6.0, + "eval_loss": 0.9792419075965881, + "eval_runtime": 521.3324, + "eval_samples_per_second": 14.653, + "eval_wer": 0.34454958689499415, + "step": 40560 + }, + { + "epoch": 6.0, + "learning_rate": 7.025222551928785e-06, + "loss": 0.9873, + "step": 40600 + }, + { + "epoch": 6.0, + "eval_loss": 0.9691166281700134, + "eval_runtime": 515.6011, + "eval_samples_per_second": 14.816, + "eval_wer": 0.34352039795305755, + "step": 40600 + }, + { + "epoch": 6.01, + "learning_rate": 7.022255192878339e-06, + "loss": 1.0519, + "step": 40640 + }, + { + "epoch": 6.01, + "eval_loss": 0.9410020112991333, + "eval_runtime": 517.2813, + "eval_samples_per_second": 14.768, + "eval_wer": 0.34069012836273194, + "step": 40640 + }, + { + "epoch": 6.01, + "learning_rate": 7.0192878338278935e-06, + "loss": 1.0277, + "step": 40680 + }, + { + "epoch": 6.01, + "eval_loss": 0.9421713948249817, + "eval_runtime": 521.4647, + "eval_samples_per_second": 14.649, + "eval_wer": 0.340632951199291, + "step": 40680 + }, + { + "epoch": 6.02, + "learning_rate": 7.016320474777448e-06, + "loss": 1.0479, + "step": 40720 + }, + { + "epoch": 6.02, + "eval_loss": 0.910408079624176, + "eval_runtime": 518.5275, + "eval_samples_per_second": 14.732, + "eval_wer": 0.3383744532433746, + "step": 40720 + }, + { + "epoch": 6.03, + "learning_rate": 7.013353115727004e-06, + "loss": 1.0779, + "step": 40760 + }, + { + "epoch": 6.03, + "eval_loss": 0.9029712080955505, + "eval_runtime": 517.0552, + "eval_samples_per_second": 14.774, + "eval_wer": 0.3383744532433746, + "step": 40760 + }, + { + "epoch": 6.03, + "learning_rate": 7.0103857566765585e-06, + "loss": 1.009, + "step": 40800 + }, + { + "epoch": 6.03, + "eval_loss": 0.9030901789665222, + "eval_runtime": 521.546, + "eval_samples_per_second": 14.647, + "eval_wer": 0.33857457331541785, + "step": 40800 + }, + { + "epoch": 6.04, + "learning_rate": 7.007418397626114e-06, + "loss": 1.0645, + "step": 40840 + }, + { + "epoch": 6.04, + "eval_loss": 0.9437246322631836, + "eval_runtime": 519.2316, + "eval_samples_per_second": 14.712, + "eval_wer": 0.3412333114154207, + "step": 40840 + }, + { + "epoch": 6.04, + "learning_rate": 7.004451038575668e-06, + "loss": 0.9416, + "step": 40880 + }, + { + "epoch": 6.04, + "eval_loss": 0.9512754082679749, + "eval_runtime": 516.6857, + "eval_samples_per_second": 14.785, + "eval_wer": 0.34086165985305467, + "step": 40880 + }, + { + "epoch": 6.05, + "learning_rate": 7.001483679525223e-06, + "loss": 1.0713, + "step": 40920 + }, + { + "epoch": 6.05, + "eval_loss": 0.9450889825820923, + "eval_runtime": 516.7587, + "eval_samples_per_second": 14.783, + "eval_wer": 0.34077589410789333, + "step": 40920 + }, + { + "epoch": 6.05, + "learning_rate": 6.998516320474777e-06, + "loss": 1.0321, + "step": 40960 + }, + { + "epoch": 6.05, + "eval_loss": 0.9223638772964478, + "eval_runtime": 515.8691, + "eval_samples_per_second": 14.808, + "eval_wer": 0.33940364218531116, + "step": 40960 + }, + { + "epoch": 6.06, + "learning_rate": 6.995548961424333e-06, + "loss": 1.0848, + "step": 41000 + }, + { + "epoch": 6.06, + "eval_loss": 0.8993661999702454, + "eval_runtime": 518.6874, + "eval_samples_per_second": 14.728, + "eval_wer": 0.3391749335315475, + "step": 41000 + }, + { + "epoch": 6.07, + "learning_rate": 6.992581602373888e-06, + "loss": 1.0208, + "step": 41040 + }, + { + "epoch": 6.07, + "eval_loss": 0.9573475122451782, + "eval_runtime": 519.1928, + "eval_samples_per_second": 14.713, + "eval_wer": 0.34223391177563683, + "step": 41040 + }, + { + "epoch": 6.07, + "learning_rate": 6.989614243323443e-06, + "loss": 1.0513, + "step": 41080 + }, + { + "epoch": 6.07, + "eval_loss": 0.921513557434082, + "eval_runtime": 516.8382, + "eval_samples_per_second": 14.78, + "eval_wer": 0.3400611795648818, + "step": 41080 + }, + { + "epoch": 6.08, + "learning_rate": 6.9866468842729974e-06, + "loss": 1.0306, + "step": 41120 + }, + { + "epoch": 6.08, + "eval_loss": 0.987941324710846, + "eval_runtime": 516.2368, + "eval_samples_per_second": 14.797, + "eval_wer": 0.34606478172617855, + "step": 41120 + }, + { + "epoch": 6.08, + "learning_rate": 6.983679525222552e-06, + "loss": 1.0857, + "step": 41160 + }, + { + "epoch": 6.08, + "eval_loss": 0.9013521075248718, + "eval_runtime": 516.5427, + "eval_samples_per_second": 14.789, + "eval_wer": 0.33994682523799996, + "step": 41160 + }, + { + "epoch": 6.09, + "learning_rate": 6.980712166172108e-06, + "loss": 0.9977, + "step": 41200 + }, + { + "epoch": 6.09, + "eval_loss": 0.9789462685585022, + "eval_runtime": 522.2177, + "eval_samples_per_second": 14.628, + "eval_wer": 0.34609337030789905, + "step": 41200 + }, + { + "epoch": 6.1, + "learning_rate": 6.9777448071216624e-06, + "loss": 1.0288, + "step": 41240 + }, + { + "epoch": 6.1, + "eval_loss": 0.9455281496047974, + "eval_runtime": 517.1743, + "eval_samples_per_second": 14.771, + "eval_wer": 0.3425197975928414, + "step": 41240 + }, + { + "epoch": 6.1, + "learning_rate": 6.974777448071217e-06, + "loss": 1.0803, + "step": 41280 + }, + { + "epoch": 6.1, + "eval_loss": 0.9269827604293823, + "eval_runtime": 515.7812, + "eval_samples_per_second": 14.811, + "eval_wer": 0.34111895708853884, + "step": 41280 + }, + { + "epoch": 6.11, + "learning_rate": 6.971810089020772e-06, + "loss": 1.0378, + "step": 41320 + }, + { + "epoch": 6.11, + "eval_loss": 1.0041701793670654, + "eval_runtime": 516.5476, + "eval_samples_per_second": 14.789, + "eval_wer": 0.3475513879756425, + "step": 41320 + }, + { + "epoch": 6.11, + "learning_rate": 6.968842729970327e-06, + "loss": 0.9954, + "step": 41360 + }, + { + "epoch": 6.11, + "eval_loss": 0.9570349454879761, + "eval_runtime": 517.3619, + "eval_samples_per_second": 14.765, + "eval_wer": 0.3438062837702622, + "step": 41360 + }, + { + "epoch": 6.12, + "learning_rate": 6.965875370919882e-06, + "loss": 1.042, + "step": 41400 + }, + { + "epoch": 6.12, + "eval_loss": 0.9941948056221008, + "eval_runtime": 518.552, + "eval_samples_per_second": 14.731, + "eval_wer": 0.34700820492295376, + "step": 41400 + }, + { + "epoch": 6.13, + "learning_rate": 6.962908011869437e-06, + "loss": 1.1212, + "step": 41440 + }, + { + "epoch": 6.13, + "eval_loss": 0.9493743181228638, + "eval_runtime": 518.4427, + "eval_samples_per_second": 14.735, + "eval_wer": 0.34323451213585293, + "step": 41440 + }, + { + "epoch": 6.13, + "learning_rate": 6.959940652818992e-06, + "loss": 1.1372, + "step": 41480 + }, + { + "epoch": 6.13, + "eval_loss": 0.9392896890640259, + "eval_runtime": 516.7765, + "eval_samples_per_second": 14.782, + "eval_wer": 0.3423482661025187, + "step": 41480 + }, + { + "epoch": 6.14, + "learning_rate": 6.956973293768546e-06, + "loss": 1.0569, + "step": 41520 + }, + { + "epoch": 6.14, + "eval_loss": 0.9607876539230347, + "eval_runtime": 516.5852, + "eval_samples_per_second": 14.787, + "eval_wer": 0.34514994711112384, + "step": 41520 + }, + { + "epoch": 6.14, + "learning_rate": 6.954005934718101e-06, + "loss": 1.0739, + "step": 41560 + }, + { + "epoch": 6.14, + "eval_loss": 0.9074859619140625, + "eval_runtime": 515.9911, + "eval_samples_per_second": 14.805, + "eval_wer": 0.3400611795648818, + "step": 41560 + }, + { + "epoch": 6.15, + "learning_rate": 6.951038575667657e-06, + "loss": 1.0102, + "step": 41600 + }, + { + "epoch": 6.15, + "eval_loss": 0.9402480721473694, + "eval_runtime": 517.6605, + "eval_samples_per_second": 14.757, + "eval_wer": 0.3420052031218731, + "step": 41600 + }, + { + "epoch": 6.16, + "learning_rate": 6.948071216617211e-06, + "loss": 1.02, + "step": 41640 + }, + { + "epoch": 6.16, + "eval_loss": 0.9796425104141235, + "eval_runtime": 516.4712, + "eval_samples_per_second": 14.791, + "eval_wer": 0.34557877583693075, + "step": 41640 + }, + { + "epoch": 6.16, + "learning_rate": 6.945103857566766e-06, + "loss": 0.996, + "step": 41680 + }, + { + "epoch": 6.16, + "eval_loss": 0.9304121732711792, + "eval_runtime": 516.5532, + "eval_samples_per_second": 14.788, + "eval_wer": 0.3403470653820864, + "step": 41680 + }, + { + "epoch": 6.17, + "learning_rate": 6.942136498516321e-06, + "loss": 1.0476, + "step": 41720 + }, + { + "epoch": 6.17, + "eval_loss": 0.9794661998748779, + "eval_runtime": 517.375, + "eval_samples_per_second": 14.765, + "eval_wer": 0.3441493467509077, + "step": 41720 + }, + { + "epoch": 6.17, + "learning_rate": 6.939169139465875e-06, + "loss": 0.9589, + "step": 41760 + }, + { + "epoch": 6.17, + "eval_loss": 0.9654977321624756, + "eval_runtime": 521.5458, + "eval_samples_per_second": 14.647, + "eval_wer": 0.3432916892992939, + "step": 41760 + }, + { + "epoch": 6.18, + "learning_rate": 6.936201780415431e-06, + "loss": 0.9957, + "step": 41800 + }, + { + "epoch": 6.18, + "eval_loss": 0.9798562526702881, + "eval_runtime": 517.9683, + "eval_samples_per_second": 14.748, + "eval_wer": 0.3441493467509077, + "step": 41800 + }, + { + "epoch": 6.18, + "learning_rate": 6.933234421364986e-06, + "loss": 1.1463, + "step": 41840 + }, + { + "epoch": 6.18, + "eval_loss": 0.9202159643173218, + "eval_runtime": 518.152, + "eval_samples_per_second": 14.743, + "eval_wer": 0.33891763629606336, + "step": 41840 + }, + { + "epoch": 6.19, + "learning_rate": 6.930267062314541e-06, + "loss": 1.07, + "step": 41880 + }, + { + "epoch": 6.19, + "eval_loss": 0.9690077304840088, + "eval_runtime": 520.9435, + "eval_samples_per_second": 14.664, + "eval_wer": 0.3430629806455302, + "step": 41880 + }, + { + "epoch": 6.2, + "learning_rate": 6.927299703264096e-06, + "loss": 1.023, + "step": 41920 + }, + { + "epoch": 6.2, + "eval_loss": 0.9628467559814453, + "eval_runtime": 517.708, + "eval_samples_per_second": 14.755, + "eval_wer": 0.3425197975928414, + "step": 41920 + }, + { + "epoch": 6.2, + "learning_rate": 6.92433234421365e-06, + "loss": 1.0004, + "step": 41960 + }, + { + "epoch": 6.2, + "eval_loss": 0.9805331230163574, + "eval_runtime": 518.171, + "eval_samples_per_second": 14.742, + "eval_wer": 0.343548986534778, + "step": 41960 + }, + { + "epoch": 6.21, + "learning_rate": 6.9213649851632045e-06, + "loss": 1.0844, + "step": 42000 + }, + { + "epoch": 6.21, + "eval_loss": 0.9469855427742004, + "eval_runtime": 522.3508, + "eval_samples_per_second": 14.624, + "eval_wer": 0.34154778581434575, + "step": 42000 + }, + { + "epoch": 6.21, + "learning_rate": 6.918397626112761e-06, + "loss": 0.9625, + "step": 42040 + }, + { + "epoch": 6.21, + "eval_loss": 0.9673171639442444, + "eval_runtime": 517.8628, + "eval_samples_per_second": 14.751, + "eval_wer": 0.34223391177563683, + "step": 42040 + }, + { + "epoch": 6.22, + "learning_rate": 6.915430267062315e-06, + "loss": 1.0274, + "step": 42080 + }, + { + "epoch": 6.22, + "eval_loss": 0.9865323901176453, + "eval_runtime": 517.5124, + "eval_samples_per_second": 14.761, + "eval_wer": 0.34409216958746675, + "step": 42080 + }, + { + "epoch": 6.23, + "learning_rate": 6.91246290801187e-06, + "loss": 1.044, + "step": 42120 + }, + { + "epoch": 6.23, + "eval_loss": 0.9777129888534546, + "eval_runtime": 518.9072, + "eval_samples_per_second": 14.721, + "eval_wer": 0.3434918093713371, + "step": 42120 + }, + { + "epoch": 6.23, + "learning_rate": 6.909495548961425e-06, + "loss": 1.0094, + "step": 42160 + }, + { + "epoch": 6.23, + "eval_loss": 1.011941909790039, + "eval_runtime": 516.7775, + "eval_samples_per_second": 14.782, + "eval_wer": 0.3466937305240287, + "step": 42160 + }, + { + "epoch": 6.24, + "learning_rate": 6.906528189910979e-06, + "loss": 0.9977, + "step": 42200 + }, + { + "epoch": 6.24, + "eval_loss": 0.9454556703567505, + "eval_runtime": 516.9242, + "eval_samples_per_second": 14.778, + "eval_wer": 0.34037565396380687, + "step": 42200 + }, + { + "epoch": 6.24, + "learning_rate": 6.903560830860535e-06, + "loss": 1.0309, + "step": 42240 + }, + { + "epoch": 6.24, + "eval_loss": 0.971244752407074, + "eval_runtime": 518.3394, + "eval_samples_per_second": 14.737, + "eval_wer": 0.34266274050144374, + "step": 42240 + }, + { + "epoch": 6.25, + "learning_rate": 6.90059347181009e-06, + "loss": 1.019, + "step": 42280 + }, + { + "epoch": 6.25, + "eval_loss": 0.9310616254806519, + "eval_runtime": 524.8015, + "eval_samples_per_second": 14.556, + "eval_wer": 0.33900340204122476, + "step": 42280 + }, + { + "epoch": 6.26, + "learning_rate": 6.897626112759644e-06, + "loss": 1.1068, + "step": 42320 + }, + { + "epoch": 6.26, + "eval_loss": 0.928028404712677, + "eval_runtime": 518.6251, + "eval_samples_per_second": 14.729, + "eval_wer": 0.33883187055090197, + "step": 42320 + }, + { + "epoch": 6.26, + "learning_rate": 6.8946587537091995e-06, + "loss": 1.0999, + "step": 42360 + }, + { + "epoch": 6.26, + "eval_loss": 0.9126626253128052, + "eval_runtime": 518.1049, + "eval_samples_per_second": 14.744, + "eval_wer": 0.33768832728208353, + "step": 42360 + }, + { + "epoch": 6.27, + "learning_rate": 6.891691394658754e-06, + "loss": 1.0794, + "step": 42400 + }, + { + "epoch": 6.27, + "eval_loss": 0.9294763207435608, + "eval_runtime": 518.4632, + "eval_samples_per_second": 14.734, + "eval_wer": 0.33863175047885874, + "step": 42400 + }, + { + "epoch": 6.27, + "learning_rate": 6.888724035608309e-06, + "loss": 1.008, + "step": 42440 + }, + { + "epoch": 6.27, + "eval_loss": 0.9695846438407898, + "eval_runtime": 518.8985, + "eval_samples_per_second": 14.722, + "eval_wer": 0.3422910889390777, + "step": 42440 + }, + { + "epoch": 6.28, + "learning_rate": 6.8857566765578645e-06, + "loss": 1.0936, + "step": 42480 + }, + { + "epoch": 6.28, + "eval_loss": 0.9167378544807434, + "eval_runtime": 517.8571, + "eval_samples_per_second": 14.751, + "eval_wer": 0.3386031618971383, + "step": 42480 + }, + { + "epoch": 6.29, + "learning_rate": 6.882789317507419e-06, + "loss": 1.01, + "step": 42520 + }, + { + "epoch": 6.29, + "eval_loss": 0.9675410389900208, + "eval_runtime": 519.4658, + "eval_samples_per_second": 14.705, + "eval_wer": 0.3428914491552074, + "step": 42520 + }, + { + "epoch": 6.29, + "learning_rate": 6.8798219584569734e-06, + "loss": 0.9894, + "step": 42560 + }, + { + "epoch": 6.29, + "eval_loss": 0.9569840431213379, + "eval_runtime": 517.6162, + "eval_samples_per_second": 14.758, + "eval_wer": 0.3420337917035936, + "step": 42560 + }, + { + "epoch": 6.3, + "learning_rate": 6.876854599406529e-06, + "loss": 1.0243, + "step": 42600 + }, + { + "epoch": 6.3, + "eval_loss": 0.9429008960723877, + "eval_runtime": 519.062, + "eval_samples_per_second": 14.717, + "eval_wer": 0.34060436261757054, + "step": 42600 + }, + { + "epoch": 6.3, + "learning_rate": 6.873887240356084e-06, + "loss": 1.0485, + "step": 42640 + }, + { + "epoch": 6.3, + "eval_loss": 0.9615535736083984, + "eval_runtime": 519.0683, + "eval_samples_per_second": 14.717, + "eval_wer": 0.3409188370164956, + "step": 42640 + }, + { + "epoch": 6.31, + "learning_rate": 6.8709198813056384e-06, + "loss": 1.069, + "step": 42680 + }, + { + "epoch": 6.31, + "eval_loss": 0.9468457102775574, + "eval_runtime": 519.9288, + "eval_samples_per_second": 14.692, + "eval_wer": 0.33971811658423623, + "step": 42680 + }, + { + "epoch": 6.31, + "learning_rate": 6.867952522255194e-06, + "loss": 1.0343, + "step": 42720 + }, + { + "epoch": 6.31, + "eval_loss": 1.0040969848632812, + "eval_runtime": 518.6041, + "eval_samples_per_second": 14.73, + "eval_wer": 0.3456645415820921, + "step": 42720 + }, + { + "epoch": 6.32, + "learning_rate": 6.864985163204748e-06, + "loss": 1.0297, + "step": 42760 + }, + { + "epoch": 6.32, + "eval_loss": 0.966876208782196, + "eval_runtime": 517.4717, + "eval_samples_per_second": 14.762, + "eval_wer": 0.34220532319391633, + "step": 42760 + }, + { + "epoch": 6.33, + "learning_rate": 6.862017804154303e-06, + "loss": 1.0307, + "step": 42800 + }, + { + "epoch": 6.33, + "eval_loss": 0.9051364064216614, + "eval_runtime": 517.9713, + "eval_samples_per_second": 14.748, + "eval_wer": 0.33863175047885874, + "step": 42800 + }, + { + "epoch": 6.33, + "learning_rate": 6.859050445103859e-06, + "loss": 1.0345, + "step": 42840 + }, + { + "epoch": 6.33, + "eval_loss": 0.9832961559295654, + "eval_runtime": 518.3968, + "eval_samples_per_second": 14.736, + "eval_wer": 0.34292003773692786, + "step": 42840 + }, + { + "epoch": 6.34, + "learning_rate": 6.856083086053413e-06, + "loss": 1.0445, + "step": 42880 + }, + { + "epoch": 6.34, + "eval_loss": 0.9443587064743042, + "eval_runtime": 522.9701, + "eval_samples_per_second": 14.607, + "eval_wer": 0.34023271105520453, + "step": 42880 + }, + { + "epoch": 6.34, + "learning_rate": 6.853115727002968e-06, + "loss": 1.0032, + "step": 42920 + }, + { + "epoch": 6.34, + "eval_loss": 0.9337226152420044, + "eval_runtime": 518.1668, + "eval_samples_per_second": 14.742, + "eval_wer": 0.33940364218531116, + "step": 42920 + }, + { + "epoch": 6.35, + "learning_rate": 6.850148367952523e-06, + "loss": 0.9917, + "step": 42960 + }, + { + "epoch": 6.35, + "eval_loss": 0.9697793126106262, + "eval_runtime": 518.5643, + "eval_samples_per_second": 14.731, + "eval_wer": 0.3422910889390777, + "step": 42960 + }, + { + "epoch": 6.36, + "learning_rate": 6.847181008902077e-06, + "loss": 1.0541, + "step": 43000 + }, + { + "epoch": 6.36, + "eval_loss": 0.9383385181427002, + "eval_runtime": 518.2591, + "eval_samples_per_second": 14.74, + "eval_wer": 0.33934646502187027, + "step": 43000 + }, + { + "epoch": 6.36, + "learning_rate": 6.844213649851632e-06, + "loss": 1.0121, + "step": 43040 + }, + { + "epoch": 6.36, + "eval_loss": 0.9556906223297119, + "eval_runtime": 517.8591, + "eval_samples_per_second": 14.751, + "eval_wer": 0.34137625432402297, + "step": 43040 + }, + { + "epoch": 6.37, + "learning_rate": 6.841246290801188e-06, + "loss": 1.0194, + "step": 43080 + }, + { + "epoch": 6.37, + "eval_loss": 0.9357848763465881, + "eval_runtime": 522.732, + "eval_samples_per_second": 14.614, + "eval_wer": 0.3400611795648818, + "step": 43080 + }, + { + "epoch": 6.37, + "learning_rate": 6.838278931750742e-06, + "loss": 1.0752, + "step": 43120 + }, + { + "epoch": 6.37, + "eval_loss": 0.9317259192466736, + "eval_runtime": 518.5919, + "eval_samples_per_second": 14.73, + "eval_wer": 0.34017553389176364, + "step": 43120 + }, + { + "epoch": 6.38, + "learning_rate": 6.835311572700297e-06, + "loss": 0.9962, + "step": 43160 + }, + { + "epoch": 6.38, + "eval_loss": 0.921172022819519, + "eval_runtime": 519.9838, + "eval_samples_per_second": 14.691, + "eval_wer": 0.3395465850939135, + "step": 43160 + }, + { + "epoch": 6.39, + "learning_rate": 6.832344213649852e-06, + "loss": 0.9713, + "step": 43200 + }, + { + "epoch": 6.39, + "eval_loss": 1.02538001537323, + "eval_runtime": 519.1476, + "eval_samples_per_second": 14.715, + "eval_wer": 0.34743703364876066, + "step": 43200 + }, + { + "epoch": 6.39, + "learning_rate": 6.8293768545994066e-06, + "loss": 1.0604, + "step": 43240 + }, + { + "epoch": 6.39, + "eval_loss": 0.9435226917266846, + "eval_runtime": 517.7959, + "eval_samples_per_second": 14.753, + "eval_wer": 0.3408330712713342, + "step": 43240 + }, + { + "epoch": 6.4, + "learning_rate": 6.826409495548963e-06, + "loss": 1.03, + "step": 43280 + }, + { + "epoch": 6.4, + "eval_loss": 0.9553525447845459, + "eval_runtime": 518.1428, + "eval_samples_per_second": 14.743, + "eval_wer": 0.34169072872294803, + "step": 43280 + }, + { + "epoch": 6.4, + "learning_rate": 6.823442136498517e-06, + "loss": 1.1079, + "step": 43320 + }, + { + "epoch": 6.4, + "eval_loss": 0.9466567635536194, + "eval_runtime": 518.7209, + "eval_samples_per_second": 14.727, + "eval_wer": 0.3409188370164956, + "step": 43320 + }, + { + "epoch": 6.41, + "learning_rate": 6.820474777448072e-06, + "loss": 1.1803, + "step": 43360 + }, + { + "epoch": 6.41, + "eval_loss": 0.9495853185653687, + "eval_runtime": 518.6396, + "eval_samples_per_second": 14.729, + "eval_wer": 0.34169072872294803, + "step": 43360 + }, + { + "epoch": 6.42, + "learning_rate": 6.817507418397626e-06, + "loss": 1.0215, + "step": 43400 + }, + { + "epoch": 6.42, + "eval_loss": 0.961620032787323, + "eval_runtime": 518.8643, + "eval_samples_per_second": 14.723, + "eval_wer": 0.3425197975928414, + "step": 43400 + }, + { + "epoch": 6.42, + "learning_rate": 6.814540059347181e-06, + "loss": 1.0191, + "step": 43440 + }, + { + "epoch": 6.42, + "eval_loss": 0.9567356705665588, + "eval_runtime": 517.3036, + "eval_samples_per_second": 14.767, + "eval_wer": 0.34169072872294803, + "step": 43440 + }, + { + "epoch": 6.43, + "learning_rate": 6.811572700296737e-06, + "loss": 1.0319, + "step": 43480 + }, + { + "epoch": 6.43, + "eval_loss": 0.9249156713485718, + "eval_runtime": 523.4836, + "eval_samples_per_second": 14.593, + "eval_wer": 0.3390319906229452, + "step": 43480 + }, + { + "epoch": 6.43, + "learning_rate": 6.808605341246292e-06, + "loss": 1.1725, + "step": 43520 + }, + { + "epoch": 6.43, + "eval_loss": 0.9146840572357178, + "eval_runtime": 518.3718, + "eval_samples_per_second": 14.737, + "eval_wer": 0.337716915863804, + "step": 43520 + }, + { + "epoch": 6.44, + "learning_rate": 6.805637982195846e-06, + "loss": 1.0391, + "step": 43560 + }, + { + "epoch": 6.44, + "eval_loss": 0.9810061454772949, + "eval_runtime": 518.023, + "eval_samples_per_second": 14.746, + "eval_wer": 0.3430343920638097, + "step": 43560 + }, + { + "epoch": 6.44, + "learning_rate": 6.802670623145401e-06, + "loss": 1.0273, + "step": 43600 + }, + { + "epoch": 6.44, + "eval_loss": 0.94829922914505, + "eval_runtime": 518.078, + "eval_samples_per_second": 14.745, + "eval_wer": 0.3400325909831613, + "step": 43600 + }, + { + "epoch": 6.45, + "learning_rate": 6.799703264094955e-06, + "loss": 1.085, + "step": 43640 + }, + { + "epoch": 6.45, + "eval_loss": 0.9405030012130737, + "eval_runtime": 518.6662, + "eval_samples_per_second": 14.728, + "eval_wer": 0.3393750536035907, + "step": 43640 + }, + { + "epoch": 6.46, + "learning_rate": 6.796735905044511e-06, + "loss": 1.058, + "step": 43680 + }, + { + "epoch": 6.46, + "eval_loss": 0.8849182724952698, + "eval_runtime": 519.2054, + "eval_samples_per_second": 14.713, + "eval_wer": 0.3377740930272449, + "step": 43680 + }, + { + "epoch": 6.46, + "learning_rate": 6.793768545994066e-06, + "loss": 1.0516, + "step": 43720 + }, + { + "epoch": 6.46, + "eval_loss": 0.9168864488601685, + "eval_runtime": 519.7074, + "eval_samples_per_second": 14.699, + "eval_wer": 0.3393178764401498, + "step": 43720 + }, + { + "epoch": 6.47, + "learning_rate": 6.790801186943621e-06, + "loss": 1.0637, + "step": 43760 + }, + { + "epoch": 6.47, + "eval_loss": 0.960401713848114, + "eval_runtime": 518.1763, + "eval_samples_per_second": 14.742, + "eval_wer": 0.34309156922725065, + "step": 43760 + }, + { + "epoch": 6.47, + "learning_rate": 6.7878338278931755e-06, + "loss": 1.0477, + "step": 43800 + }, + { + "epoch": 6.47, + "eval_loss": 0.9503666758537292, + "eval_runtime": 518.3112, + "eval_samples_per_second": 14.738, + "eval_wer": 0.3421767346121959, + "step": 43800 + }, + { + "epoch": 6.48, + "learning_rate": 6.78486646884273e-06, + "loss": 1.0153, + "step": 43840 + }, + { + "epoch": 6.48, + "eval_loss": 0.9432001113891602, + "eval_runtime": 519.7204, + "eval_samples_per_second": 14.698, + "eval_wer": 0.34074730552617283, + "step": 43840 + }, + { + "epoch": 6.49, + "learning_rate": 6.781899109792286e-06, + "loss": 1.1138, + "step": 43880 + }, + { + "epoch": 6.49, + "eval_loss": 0.9068188071250916, + "eval_runtime": 523.8466, + "eval_samples_per_second": 14.583, + "eval_wer": 0.33857457331541785, + "step": 43880 + }, + { + "epoch": 6.49, + "learning_rate": 6.7789317507418406e-06, + "loss": 0.9856, + "step": 43920 + }, + { + "epoch": 6.49, + "eval_loss": 0.9475705027580261, + "eval_runtime": 519.1655, + "eval_samples_per_second": 14.714, + "eval_wer": 0.3408044826896138, + "step": 43920 + }, + { + "epoch": 6.5, + "learning_rate": 6.775964391691395e-06, + "loss": 1.0439, + "step": 43960 + }, + { + "epoch": 6.5, + "eval_loss": 0.9484663009643555, + "eval_runtime": 518.1354, + "eval_samples_per_second": 14.743, + "eval_wer": 0.3400325909831613, + "step": 43960 + }, + { + "epoch": 6.5, + "learning_rate": 6.77299703264095e-06, + "loss": 1.0584, + "step": 44000 + }, + { + "epoch": 6.5, + "eval_loss": 0.9141130447387695, + "eval_runtime": 518.0944, + "eval_samples_per_second": 14.744, + "eval_wer": 0.33811715600789044, + "step": 44000 + }, + { + "epoch": 6.51, + "learning_rate": 6.770029673590505e-06, + "loss": 1.0235, + "step": 44040 + }, + { + "epoch": 6.51, + "eval_loss": 0.9584606289863586, + "eval_runtime": 518.3269, + "eval_samples_per_second": 14.738, + "eval_wer": 0.34111895708853884, + "step": 44040 + }, + { + "epoch": 6.52, + "learning_rate": 6.767062314540059e-06, + "loss": 1.0065, + "step": 44080 + }, + { + "epoch": 6.52, + "eval_loss": 0.958109974861145, + "eval_runtime": 518.2683, + "eval_samples_per_second": 14.739, + "eval_wer": 0.3404900082906887, + "step": 44080 + }, + { + "epoch": 6.52, + "learning_rate": 6.764094955489615e-06, + "loss": 1.0187, + "step": 44120 + }, + { + "epoch": 6.52, + "eval_loss": 0.9575849175453186, + "eval_runtime": 520.5418, + "eval_samples_per_second": 14.675, + "eval_wer": 0.34008976814660224, + "step": 44120 + }, + { + "epoch": 6.53, + "learning_rate": 6.76112759643917e-06, + "loss": 1.0077, + "step": 44160 + }, + { + "epoch": 6.53, + "eval_loss": 0.9747424721717834, + "eval_runtime": 518.9236, + "eval_samples_per_second": 14.721, + "eval_wer": 0.3414334314874639, + "step": 44160 + }, + { + "epoch": 6.53, + "learning_rate": 6.758160237388724e-06, + "loss": 1.048, + "step": 44200 + }, + { + "epoch": 6.53, + "eval_loss": 0.9795682430267334, + "eval_runtime": 517.1776, + "eval_samples_per_second": 14.771, + "eval_wer": 0.3418336716315504, + "step": 44200 + }, + { + "epoch": 6.54, + "learning_rate": 6.7551928783382795e-06, + "loss": 1.0524, + "step": 44240 + }, + { + "epoch": 6.54, + "eval_loss": 0.9583014845848083, + "eval_runtime": 516.3226, + "eval_samples_per_second": 14.795, + "eval_wer": 0.34000400240144085, + "step": 44240 + }, + { + "epoch": 6.55, + "learning_rate": 6.752225519287834e-06, + "loss": 1.0444, + "step": 44280 + }, + { + "epoch": 6.55, + "eval_loss": 0.9812473058700562, + "eval_runtime": 520.4978, + "eval_samples_per_second": 14.676, + "eval_wer": 0.34309156922725065, + "step": 44280 + }, + { + "epoch": 6.55, + "learning_rate": 6.74925816023739e-06, + "loss": 1.0567, + "step": 44320 + }, + { + "epoch": 6.55, + "eval_loss": 0.9156949520111084, + "eval_runtime": 517.3354, + "eval_samples_per_second": 14.766, + "eval_wer": 0.338774693387461, + "step": 44320 + }, + { + "epoch": 6.56, + "learning_rate": 6.7462908011869445e-06, + "loss": 0.999, + "step": 44360 + }, + { + "epoch": 6.56, + "eval_loss": 0.9418641328811646, + "eval_runtime": 517.4578, + "eval_samples_per_second": 14.763, + "eval_wer": 0.34074730552617283, + "step": 44360 + }, + { + "epoch": 6.56, + "learning_rate": 6.743323442136499e-06, + "loss": 0.9938, + "step": 44400 + }, + { + "epoch": 6.56, + "eval_loss": 0.9844051599502563, + "eval_runtime": 521.3306, + "eval_samples_per_second": 14.653, + "eval_wer": 0.3438062837702622, + "step": 44400 + }, + { + "epoch": 6.57, + "learning_rate": 6.740356083086053e-06, + "loss": 1.0065, + "step": 44440 + }, + { + "epoch": 6.57, + "eval_loss": 0.9740300178527832, + "eval_runtime": 517.4671, + "eval_samples_per_second": 14.762, + "eval_wer": 0.3426055633380028, + "step": 44440 + }, + { + "epoch": 6.57, + "learning_rate": 6.737388724035609e-06, + "loss": 1.0867, + "step": 44480 + }, + { + "epoch": 6.57, + "eval_loss": 0.9628952145576477, + "eval_runtime": 517.7074, + "eval_samples_per_second": 14.755, + "eval_wer": 0.34191943737671177, + "step": 44480 + }, + { + "epoch": 6.58, + "learning_rate": 6.734421364985164e-06, + "loss": 1.0295, + "step": 44520 + }, + { + "epoch": 6.58, + "eval_loss": 0.9897034168243408, + "eval_runtime": 521.6065, + "eval_samples_per_second": 14.645, + "eval_wer": 0.34412075816918725, + "step": 44520 + }, + { + "epoch": 6.59, + "learning_rate": 6.731454005934719e-06, + "loss": 1.0346, + "step": 44560 + }, + { + "epoch": 6.59, + "eval_loss": 0.9870888590812683, + "eval_runtime": 517.8054, + "eval_samples_per_second": 14.753, + "eval_wer": 0.34394922667886446, + "step": 44560 + }, + { + "epoch": 6.59, + "learning_rate": 6.728486646884274e-06, + "loss": 1.0326, + "step": 44600 + }, + { + "epoch": 6.59, + "eval_loss": 0.9788744449615479, + "eval_runtime": 517.8163, + "eval_samples_per_second": 14.752, + "eval_wer": 0.3433202778810143, + "step": 44600 + }, + { + "epoch": 6.6, + "learning_rate": 6.725519287833828e-06, + "loss": 1.0822, + "step": 44640 + }, + { + "epoch": 6.6, + "eval_loss": 0.9938949942588806, + "eval_runtime": 517.902, + "eval_samples_per_second": 14.75, + "eval_wer": 0.34386346093370307, + "step": 44640 + }, + { + "epoch": 6.6, + "learning_rate": 6.7225519287833826e-06, + "loss": 1.0568, + "step": 44680 + }, + { + "epoch": 6.6, + "eval_loss": 0.9342981576919556, + "eval_runtime": 518.1786, + "eval_samples_per_second": 14.742, + "eval_wer": 0.3385173961519769, + "step": 44680 + }, + { + "epoch": 6.61, + "learning_rate": 6.719584569732939e-06, + "loss": 0.9838, + "step": 44720 + }, + { + "epoch": 6.61, + "eval_loss": 0.9663140177726746, + "eval_runtime": 518.3797, + "eval_samples_per_second": 14.736, + "eval_wer": 0.3413476657423025, + "step": 44720 + }, + { + "epoch": 6.62, + "learning_rate": 6.716617210682493e-06, + "loss": 1.0952, + "step": 44760 + }, + { + "epoch": 6.62, + "eval_loss": 0.9758021235466003, + "eval_runtime": 516.4551, + "eval_samples_per_second": 14.791, + "eval_wer": 0.3420337917035936, + "step": 44760 + }, + { + "epoch": 6.62, + "learning_rate": 6.7136498516320484e-06, + "loss": 1.0537, + "step": 44800 + }, + { + "epoch": 6.62, + "eval_loss": 0.9853593707084656, + "eval_runtime": 522.57, + "eval_samples_per_second": 14.618, + "eval_wer": 0.34274850624660513, + "step": 44800 + }, + { + "epoch": 6.63, + "learning_rate": 6.710682492581603e-06, + "loss": 1.0639, + "step": 44840 + }, + { + "epoch": 6.63, + "eval_loss": 0.8960084319114685, + "eval_runtime": 518.0484, + "eval_samples_per_second": 14.746, + "eval_wer": 0.33651619543154465, + "step": 44840 + }, + { + "epoch": 6.63, + "learning_rate": 6.707715133531157e-06, + "loss": 1.0678, + "step": 44880 + }, + { + "epoch": 6.63, + "eval_loss": 0.9075257182121277, + "eval_runtime": 517.6036, + "eval_samples_per_second": 14.758, + "eval_wer": 0.3381457445896109, + "step": 44880 + }, + { + "epoch": 6.64, + "learning_rate": 6.7047477744807135e-06, + "loss": 1.0031, + "step": 44920 + }, + { + "epoch": 6.64, + "eval_loss": 1.013589859008789, + "eval_runtime": 523.3629, + "eval_samples_per_second": 14.596, + "eval_wer": 0.3447497069670374, + "step": 44920 + }, + { + "epoch": 6.65, + "learning_rate": 6.701780415430268e-06, + "loss": 1.0413, + "step": 44960 + }, + { + "epoch": 6.65, + "eval_loss": 0.9521129131317139, + "eval_runtime": 518.4933, + "eval_samples_per_second": 14.733, + "eval_wer": 0.34069012836273194, + "step": 44960 + }, + { + "epoch": 6.65, + "learning_rate": 6.698813056379822e-06, + "loss": 1.0565, + "step": 45000 + }, + { + "epoch": 6.65, + "eval_loss": 0.909016489982605, + "eval_runtime": 518.0621, + "eval_samples_per_second": 14.745, + "eval_wer": 0.3374024414648789, + "step": 45000 + }, + { + "epoch": 6.66, + "learning_rate": 6.695845697329378e-06, + "loss": 1.0887, + "step": 45040 + }, + { + "epoch": 6.66, + "eval_loss": 0.964550256729126, + "eval_runtime": 518.2674, + "eval_samples_per_second": 14.739, + "eval_wer": 0.3411475456702593, + "step": 45040 + }, + { + "epoch": 6.66, + "learning_rate": 6.692878338278932e-06, + "loss": 0.9852, + "step": 45080 + }, + { + "epoch": 6.66, + "eval_loss": 0.9912906885147095, + "eval_runtime": 519.6398, + "eval_samples_per_second": 14.701, + "eval_wer": 0.3426913290831642, + "step": 45080 + }, + { + "epoch": 6.67, + "learning_rate": 6.6899109792284865e-06, + "loss": 1.1365, + "step": 45120 + }, + { + "epoch": 6.67, + "eval_loss": 0.9597486257553101, + "eval_runtime": 518.314, + "eval_samples_per_second": 14.738, + "eval_wer": 0.3413190771605821, + "step": 45120 + }, + { + "epoch": 6.68, + "learning_rate": 6.686943620178043e-06, + "loss": 1.0144, + "step": 45160 + }, + { + "epoch": 6.68, + "eval_loss": 0.9832190871238708, + "eval_runtime": 522.2911, + "eval_samples_per_second": 14.626, + "eval_wer": 0.34257697475628235, + "step": 45160 + }, + { + "epoch": 6.68, + "learning_rate": 6.683976261127597e-06, + "loss": 1.0565, + "step": 45200 + }, + { + "epoch": 6.68, + "eval_loss": 0.9541497826576233, + "eval_runtime": 519.8354, + "eval_samples_per_second": 14.695, + "eval_wer": 0.3405757740358501, + "step": 45200 + }, + { + "epoch": 6.69, + "learning_rate": 6.6810089020771515e-06, + "loss": 0.9186, + "step": 45240 + }, + { + "epoch": 6.69, + "eval_loss": 0.9848554730415344, + "eval_runtime": 520.4819, + "eval_samples_per_second": 14.677, + "eval_wer": 0.3425483861745619, + "step": 45240 + }, + { + "epoch": 6.69, + "learning_rate": 6.678041543026707e-06, + "loss": 1.0164, + "step": 45280 + }, + { + "epoch": 6.69, + "eval_loss": 0.938230574131012, + "eval_runtime": 519.5555, + "eval_samples_per_second": 14.703, + "eval_wer": 0.3390319906229452, + "step": 45280 + }, + { + "epoch": 6.7, + "learning_rate": 6.675074183976261e-06, + "loss": 1.0202, + "step": 45320 + }, + { + "epoch": 6.7, + "eval_loss": 0.9416821002960205, + "eval_runtime": 518.3366, + "eval_samples_per_second": 14.738, + "eval_wer": 0.3393178764401498, + "step": 45320 + }, + { + "epoch": 6.71, + "learning_rate": 6.6721068249258166e-06, + "loss": 1.0134, + "step": 45360 + }, + { + "epoch": 6.71, + "eval_loss": 0.9644172787666321, + "eval_runtime": 523.4715, + "eval_samples_per_second": 14.593, + "eval_wer": 0.34140484290574347, + "step": 45360 + }, + { + "epoch": 6.71, + "learning_rate": 6.669139465875372e-06, + "loss": 0.9914, + "step": 45400 + }, + { + "epoch": 6.71, + "eval_loss": 0.9629830718040466, + "eval_runtime": 519.1756, + "eval_samples_per_second": 14.714, + "eval_wer": 0.3414334314874639, + "step": 45400 + }, + { + "epoch": 6.72, + "learning_rate": 6.666172106824926e-06, + "loss": 1.0576, + "step": 45440 + }, + { + "epoch": 6.72, + "eval_loss": 0.9839049577713013, + "eval_runtime": 518.7516, + "eval_samples_per_second": 14.726, + "eval_wer": 0.3422910889390777, + "step": 45440 + }, + { + "epoch": 6.72, + "learning_rate": 6.663204747774481e-06, + "loss": 0.9965, + "step": 45480 + }, + { + "epoch": 6.72, + "eval_loss": 1.0161035060882568, + "eval_runtime": 518.3264, + "eval_samples_per_second": 14.738, + "eval_wer": 0.3447211183853169, + "step": 45480 + }, + { + "epoch": 6.73, + "learning_rate": 6.660237388724036e-06, + "loss": 1.0222, + "step": 45520 + }, + { + "epoch": 6.73, + "eval_loss": 0.957398533821106, + "eval_runtime": 519.2192, + "eval_samples_per_second": 14.712, + "eval_wer": 0.3403184768003659, + "step": 45520 + }, + { + "epoch": 6.73, + "learning_rate": 6.657270029673591e-06, + "loss": 1.1072, + "step": 45560 + }, + { + "epoch": 6.73, + "eval_loss": 0.9424870014190674, + "eval_runtime": 518.7634, + "eval_samples_per_second": 14.725, + "eval_wer": 0.33923211069498843, + "step": 45560 + }, + { + "epoch": 6.74, + "learning_rate": 6.654302670623146e-06, + "loss": 1.0581, + "step": 45600 + }, + { + "epoch": 6.74, + "eval_loss": 0.9570872187614441, + "eval_runtime": 519.1419, + "eval_samples_per_second": 14.715, + "eval_wer": 0.3400325909831613, + "step": 45600 + }, + { + "epoch": 6.75, + "learning_rate": 6.651335311572701e-06, + "loss": 1.0767, + "step": 45640 + }, + { + "epoch": 6.75, + "eval_loss": 0.9220086932182312, + "eval_runtime": 517.5198, + "eval_samples_per_second": 14.761, + "eval_wer": 0.3387461048057406, + "step": 45640 + }, + { + "epoch": 6.75, + "learning_rate": 6.6483679525222555e-06, + "loss": 1.0343, + "step": 45680 + }, + { + "epoch": 6.75, + "eval_loss": 0.9139286279678345, + "eval_runtime": 518.6234, + "eval_samples_per_second": 14.729, + "eval_wer": 0.3381743331713314, + "step": 45680 + }, + { + "epoch": 6.76, + "learning_rate": 6.64540059347181e-06, + "loss": 1.0768, + "step": 45720 + }, + { + "epoch": 6.76, + "eval_loss": 0.9151127338409424, + "eval_runtime": 517.7128, + "eval_samples_per_second": 14.755, + "eval_wer": 0.3381457445896109, + "step": 45720 + }, + { + "epoch": 6.76, + "learning_rate": 6.642433234421366e-06, + "loss": 1.0666, + "step": 45760 + }, + { + "epoch": 6.76, + "eval_loss": 0.9325342178344727, + "eval_runtime": 519.9459, + "eval_samples_per_second": 14.692, + "eval_wer": 0.3388032819691815, + "step": 45760 + }, + { + "epoch": 6.77, + "learning_rate": 6.6394658753709205e-06, + "loss": 1.0676, + "step": 45800 + }, + { + "epoch": 6.77, + "eval_loss": 0.9377098679542542, + "eval_runtime": 518.7451, + "eval_samples_per_second": 14.726, + "eval_wer": 0.3390891677863861, + "step": 45800 + }, + { + "epoch": 6.78, + "learning_rate": 6.636498516320476e-06, + "loss": 1.0083, + "step": 45840 + }, + { + "epoch": 6.78, + "eval_loss": 0.9412100911140442, + "eval_runtime": 519.2326, + "eval_samples_per_second": 14.712, + "eval_wer": 0.3393750536035907, + "step": 45840 + }, + { + "epoch": 6.78, + "learning_rate": 6.63353115727003e-06, + "loss": 1.0513, + "step": 45880 + }, + { + "epoch": 6.78, + "eval_loss": 0.9039720296859741, + "eval_runtime": 518.7173, + "eval_samples_per_second": 14.727, + "eval_wer": 0.336973612739072, + "step": 45880 + }, + { + "epoch": 6.79, + "learning_rate": 6.630563798219585e-06, + "loss": 0.9818, + "step": 45920 + }, + { + "epoch": 6.79, + "eval_loss": 0.9661240577697754, + "eval_runtime": 522.5932, + "eval_samples_per_second": 14.617, + "eval_wer": 0.34051859687240915, + "step": 45920 + }, + { + "epoch": 6.79, + "learning_rate": 6.627596439169141e-06, + "loss": 1.0533, + "step": 45960 + }, + { + "epoch": 6.79, + "eval_loss": 1.0201531648635864, + "eval_runtime": 518.0421, + "eval_samples_per_second": 14.746, + "eval_wer": 0.34520712427456474, + "step": 45960 + }, + { + "epoch": 6.8, + "learning_rate": 6.624629080118695e-06, + "loss": 0.975, + "step": 46000 + }, + { + "epoch": 6.8, + "eval_loss": 0.9392632842063904, + "eval_runtime": 519.2717, + "eval_samples_per_second": 14.711, + "eval_wer": 0.3382886874982132, + "step": 46000 + }, + { + "epoch": 6.81, + "learning_rate": 6.62166172106825e-06, + "loss": 1.02, + "step": 46040 + }, + { + "epoch": 6.81, + "eval_loss": 0.9480339288711548, + "eval_runtime": 522.5189, + "eval_samples_per_second": 14.62, + "eval_wer": 0.3386603390605792, + "step": 46040 + }, + { + "epoch": 6.81, + "learning_rate": 6.618694362017805e-06, + "loss": 0.9493, + "step": 46080 + }, + { + "epoch": 6.81, + "eval_loss": 1.0074026584625244, + "eval_runtime": 518.4386, + "eval_samples_per_second": 14.735, + "eval_wer": 0.3437776951885417, + "step": 46080 + }, + { + "epoch": 6.82, + "learning_rate": 6.615727002967359e-06, + "loss": 1.1311, + "step": 46120 + }, + { + "epoch": 6.82, + "eval_loss": 0.9043002128601074, + "eval_runtime": 518.6771, + "eval_samples_per_second": 14.728, + "eval_wer": 0.3366877269218674, + "step": 46120 + }, + { + "epoch": 6.82, + "learning_rate": 6.612759643916914e-06, + "loss": 0.9729, + "step": 46160 + }, + { + "epoch": 6.82, + "eval_loss": 0.9258018136024475, + "eval_runtime": 519.2236, + "eval_samples_per_second": 14.712, + "eval_wer": 0.3378598587724063, + "step": 46160 + }, + { + "epoch": 6.83, + "learning_rate": 6.60979228486647e-06, + "loss": 1.0414, + "step": 46200 + }, + { + "epoch": 6.83, + "eval_loss": 0.9422390460968018, + "eval_runtime": 518.6072, + "eval_samples_per_second": 14.73, + "eval_wer": 0.3381743331713314, + "step": 46200 + }, + { + "epoch": 6.84, + "learning_rate": 6.6068249258160244e-06, + "loss": 1.0492, + "step": 46240 + }, + { + "epoch": 6.84, + "eval_loss": 0.9531782269477844, + "eval_runtime": 517.7381, + "eval_samples_per_second": 14.755, + "eval_wer": 0.33923211069498843, + "step": 46240 + }, + { + "epoch": 6.84, + "learning_rate": 6.603857566765579e-06, + "loss": 0.958, + "step": 46280 + }, + { + "epoch": 6.84, + "eval_loss": 0.9989124536514282, + "eval_runtime": 520.5664, + "eval_samples_per_second": 14.674, + "eval_wer": 0.34249120901112096, + "step": 46280 + }, + { + "epoch": 6.85, + "learning_rate": 6.600890207715134e-06, + "loss": 1.0856, + "step": 46320 + }, + { + "epoch": 6.85, + "eval_loss": 0.924593985080719, + "eval_runtime": 520.454, + "eval_samples_per_second": 14.678, + "eval_wer": 0.33788844735412676, + "step": 46320 + }, + { + "epoch": 6.85, + "learning_rate": 6.597922848664689e-06, + "loss": 1.0448, + "step": 46360 + }, + { + "epoch": 6.85, + "eval_loss": 0.9174411296844482, + "eval_runtime": 517.9496, + "eval_samples_per_second": 14.749, + "eval_wer": 0.33803139026272905, + "step": 46360 + }, + { + "epoch": 6.86, + "learning_rate": 6.594955489614244e-06, + "loss": 1.0445, + "step": 46400 + }, + { + "epoch": 6.86, + "eval_loss": 0.9239253997802734, + "eval_runtime": 519.913, + "eval_samples_per_second": 14.693, + "eval_wer": 0.3385173961519769, + "step": 46400 + }, + { + "epoch": 6.86, + "learning_rate": 6.591988130563799e-06, + "loss": 1.0004, + "step": 46440 + }, + { + "epoch": 6.86, + "eval_loss": 0.9684176445007324, + "eval_runtime": 523.3474, + "eval_samples_per_second": 14.596, + "eval_wer": 0.3415191972326253, + "step": 46440 + }, + { + "epoch": 6.87, + "learning_rate": 6.589020771513354e-06, + "loss": 1.0123, + "step": 46480 + }, + { + "epoch": 6.87, + "eval_loss": 0.9655300378799438, + "eval_runtime": 518.9509, + "eval_samples_per_second": 14.72, + "eval_wer": 0.34120472283370024, + "step": 46480 + }, + { + "epoch": 6.88, + "learning_rate": 6.586053412462908e-06, + "loss": 1.0529, + "step": 46520 + }, + { + "epoch": 6.88, + "eval_loss": 0.958466649055481, + "eval_runtime": 519.6052, + "eval_samples_per_second": 14.702, + "eval_wer": 0.34103319134337745, + "step": 46520 + }, + { + "epoch": 6.88, + "learning_rate": 6.583086053412463e-06, + "loss": 1.0228, + "step": 46560 + }, + { + "epoch": 6.88, + "eval_loss": 0.9584649205207825, + "eval_runtime": 519.5145, + "eval_samples_per_second": 14.704, + "eval_wer": 0.34117613425197973, + "step": 46560 + }, + { + "epoch": 6.89, + "learning_rate": 6.580118694362019e-06, + "loss": 1.0198, + "step": 46600 + }, + { + "epoch": 6.89, + "eval_loss": 0.9663130640983582, + "eval_runtime": 519.6186, + "eval_samples_per_second": 14.701, + "eval_wer": 0.3418336716315504, + "step": 46600 + }, + { + "epoch": 6.89, + "learning_rate": 6.577151335311573e-06, + "loss": 0.9848, + "step": 46640 + }, + { + "epoch": 6.89, + "eval_loss": 0.9407705664634705, + "eval_runtime": 519.2767, + "eval_samples_per_second": 14.711, + "eval_wer": 0.339203522113268, + "step": 46640 + }, + { + "epoch": 6.9, + "learning_rate": 6.574183976261128e-06, + "loss": 0.9942, + "step": 46680 + }, + { + "epoch": 6.9, + "eval_loss": 0.9171158075332642, + "eval_runtime": 519.4529, + "eval_samples_per_second": 14.706, + "eval_wer": 0.3378598587724063, + "step": 46680 + }, + { + "epoch": 6.91, + "learning_rate": 6.571216617210683e-06, + "loss": 1.0639, + "step": 46720 + }, + { + "epoch": 6.91, + "eval_loss": 0.9592843055725098, + "eval_runtime": 519.8172, + "eval_samples_per_second": 14.696, + "eval_wer": 0.3396323508390749, + "step": 46720 + }, + { + "epoch": 6.91, + "learning_rate": 6.568249258160237e-06, + "loss": 1.0263, + "step": 46760 + }, + { + "epoch": 6.91, + "eval_loss": 0.9080811738967896, + "eval_runtime": 518.3733, + "eval_samples_per_second": 14.736, + "eval_wer": 0.3372594985562766, + "step": 46760 + }, + { + "epoch": 6.92, + "learning_rate": 6.565281899109793e-06, + "loss": 1.0246, + "step": 46800 + }, + { + "epoch": 6.92, + "eval_loss": 0.9387766718864441, + "eval_runtime": 518.7265, + "eval_samples_per_second": 14.726, + "eval_wer": 0.33863175047885874, + "step": 46800 + }, + { + "epoch": 6.92, + "learning_rate": 6.562314540059348e-06, + "loss": 1.0504, + "step": 46840 + }, + { + "epoch": 6.92, + "eval_loss": 0.9087313413619995, + "eval_runtime": 523.7866, + "eval_samples_per_second": 14.584, + "eval_wer": 0.3373166757197175, + "step": 46840 + }, + { + "epoch": 6.93, + "learning_rate": 6.559347181008902e-06, + "loss": 0.9373, + "step": 46880 + }, + { + "epoch": 6.93, + "eval_loss": 0.9822513461112976, + "eval_runtime": 520.1839, + "eval_samples_per_second": 14.685, + "eval_wer": 0.34337745504445527, + "step": 46880 + }, + { + "epoch": 6.94, + "learning_rate": 6.556379821958458e-06, + "loss": 1.022, + "step": 46920 + }, + { + "epoch": 6.94, + "eval_loss": 0.952470064163208, + "eval_runtime": 520.0643, + "eval_samples_per_second": 14.689, + "eval_wer": 0.34146202006918436, + "step": 46920 + }, + { + "epoch": 6.94, + "learning_rate": 6.553412462908012e-06, + "loss": 1.0284, + "step": 46960 + }, + { + "epoch": 6.94, + "eval_loss": 0.9467082023620605, + "eval_runtime": 523.0265, + "eval_samples_per_second": 14.605, + "eval_wer": 0.34008976814660224, + "step": 46960 + }, + { + "epoch": 6.95, + "learning_rate": 6.550445103857568e-06, + "loss": 1.008, + "step": 47000 + }, + { + "epoch": 6.95, + "eval_loss": 0.9011938571929932, + "eval_runtime": 518.9318, + "eval_samples_per_second": 14.721, + "eval_wer": 0.33651619543154465, + "step": 47000 + }, + { + "epoch": 6.95, + "learning_rate": 6.547477744807123e-06, + "loss": 1.0156, + "step": 47040 + }, + { + "epoch": 6.95, + "eval_loss": 0.9419434070587158, + "eval_runtime": 520.4066, + "eval_samples_per_second": 14.679, + "eval_wer": 0.3391749335315475, + "step": 47040 + }, + { + "epoch": 6.96, + "learning_rate": 6.544510385756677e-06, + "loss": 1.023, + "step": 47080 + }, + { + "epoch": 6.96, + "eval_loss": 0.920754611492157, + "eval_runtime": 520.9483, + "eval_samples_per_second": 14.664, + "eval_wer": 0.3384316304068155, + "step": 47080 + }, + { + "epoch": 6.97, + "learning_rate": 6.5415430267062315e-06, + "loss": 1.0414, + "step": 47120 + }, + { + "epoch": 6.97, + "eval_loss": 0.940671443939209, + "eval_runtime": 520.1854, + "eval_samples_per_second": 14.685, + "eval_wer": 0.33974670516595673, + "step": 47120 + }, + { + "epoch": 6.97, + "learning_rate": 6.538575667655787e-06, + "loss": 1.0349, + "step": 47160 + }, + { + "epoch": 6.97, + "eval_loss": 0.9437512755393982, + "eval_runtime": 517.697, + "eval_samples_per_second": 14.756, + "eval_wer": 0.3402041224734841, + "step": 47160 + }, + { + "epoch": 6.98, + "learning_rate": 6.535608308605341e-06, + "loss": 0.986, + "step": 47200 + }, + { + "epoch": 6.98, + "eval_loss": 0.9611278176307678, + "eval_runtime": 519.9279, + "eval_samples_per_second": 14.692, + "eval_wer": 0.3420052031218731, + "step": 47200 + }, + { + "epoch": 6.98, + "learning_rate": 6.532640949554897e-06, + "loss": 0.9749, + "step": 47240 + }, + { + "epoch": 6.98, + "eval_loss": 0.9494714140892029, + "eval_runtime": 522.8639, + "eval_samples_per_second": 14.61, + "eval_wer": 0.3401469453100432, + "step": 47240 + }, + { + "epoch": 6.99, + "learning_rate": 6.529673590504452e-06, + "loss": 1.0868, + "step": 47280 + }, + { + "epoch": 6.99, + "eval_loss": 0.9364571571350098, + "eval_runtime": 519.1193, + "eval_samples_per_second": 14.715, + "eval_wer": 0.33891763629606336, + "step": 47280 + }, + { + "epoch": 6.99, + "learning_rate": 6.526706231454006e-06, + "loss": 0.999, + "step": 47320 + }, + { + "epoch": 6.99, + "eval_loss": 0.9458136558532715, + "eval_runtime": 520.178, + "eval_samples_per_second": 14.685, + "eval_wer": 0.3388890477143429, + "step": 47320 + }, + { + "epoch": 7.0, + "learning_rate": 6.523738872403561e-06, + "loss": 0.9456, + "step": 47360 + }, + { + "epoch": 7.0, + "eval_loss": 1.022178053855896, + "eval_runtime": 517.6267, + "eval_samples_per_second": 14.758, + "eval_wer": 0.3456645415820921, + "step": 47360 + }, + { + "epoch": 7.01, + "learning_rate": 6.520771513353116e-06, + "loss": 0.9654, + "step": 47400 + }, + { + "epoch": 7.01, + "eval_loss": 1.0016549825668335, + "eval_runtime": 517.3942, + "eval_samples_per_second": 14.764, + "eval_wer": 0.34426370107778953, + "step": 47400 + }, + { + "epoch": 7.01, + "learning_rate": 6.517804154302671e-06, + "loss": 0.9883, + "step": 47440 + }, + { + "epoch": 7.01, + "eval_loss": 0.980663001537323, + "eval_runtime": 518.3567, + "eval_samples_per_second": 14.737, + "eval_wer": 0.3420909688670345, + "step": 47440 + }, + { + "epoch": 7.02, + "learning_rate": 6.5148367952522265e-06, + "loss": 0.9802, + "step": 47480 + }, + { + "epoch": 7.02, + "eval_loss": 0.9422715902328491, + "eval_runtime": 520.8303, + "eval_samples_per_second": 14.667, + "eval_wer": 0.33906057920466565, + "step": 47480 + }, + { + "epoch": 7.02, + "learning_rate": 6.511869436201781e-06, + "loss": 1.0004, + "step": 47520 + }, + { + "epoch": 7.02, + "eval_loss": 0.9424909353256226, + "eval_runtime": 517.6095, + "eval_samples_per_second": 14.758, + "eval_wer": 0.3393750536035907, + "step": 47520 + }, + { + "epoch": 7.03, + "learning_rate": 6.5089020771513354e-06, + "loss": 1.0626, + "step": 47560 + }, + { + "epoch": 7.03, + "eval_loss": 0.890785813331604, + "eval_runtime": 517.1815, + "eval_samples_per_second": 14.77, + "eval_wer": 0.33460076045627374, + "step": 47560 + }, + { + "epoch": 7.04, + "learning_rate": 6.50593471810089e-06, + "loss": 0.992, + "step": 47600 + }, + { + "epoch": 7.04, + "eval_loss": 0.9768620133399963, + "eval_runtime": 522.2821, + "eval_samples_per_second": 14.626, + "eval_wer": 0.3408044826896138, + "step": 47600 + }, + { + "epoch": 7.04, + "learning_rate": 6.502967359050446e-06, + "loss": 1.013, + "step": 47640 + }, + { + "epoch": 7.04, + "eval_loss": 0.954316258430481, + "eval_runtime": 517.9828, + "eval_samples_per_second": 14.748, + "eval_wer": 0.3398038823293976, + "step": 47640 + }, + { + "epoch": 7.05, + "learning_rate": 6.5000000000000004e-06, + "loss": 1.0882, + "step": 47680 + }, + { + "epoch": 7.05, + "eval_loss": 0.8957270979881287, + "eval_runtime": 517.6938, + "eval_samples_per_second": 14.756, + "eval_wer": 0.3352868864175648, + "step": 47680 + }, + { + "epoch": 7.05, + "learning_rate": 6.497032640949556e-06, + "loss": 0.9787, + "step": 47720 + }, + { + "epoch": 7.05, + "eval_loss": 0.9949858784675598, + "eval_runtime": 520.8717, + "eval_samples_per_second": 14.666, + "eval_wer": 0.3427770948283256, + "step": 47720 + }, + { + "epoch": 7.06, + "learning_rate": 6.49406528189911e-06, + "loss": 1.0845, + "step": 47760 + }, + { + "epoch": 7.06, + "eval_loss": 0.914729118347168, + "eval_runtime": 517.1607, + "eval_samples_per_second": 14.771, + "eval_wer": 0.33634466394122187, + "step": 47760 + }, + { + "epoch": 7.07, + "learning_rate": 6.491097922848665e-06, + "loss": 0.9758, + "step": 47800 + }, + { + "epoch": 7.07, + "eval_loss": 0.8954439163208008, + "eval_runtime": 517.7767, + "eval_samples_per_second": 14.753, + "eval_wer": 0.33454358329283285, + "step": 47800 + }, + { + "epoch": 7.07, + "learning_rate": 6.488130563798221e-06, + "loss": 1.0048, + "step": 47840 + }, + { + "epoch": 7.07, + "eval_loss": 0.9299134612083435, + "eval_runtime": 517.3405, + "eval_samples_per_second": 14.766, + "eval_wer": 0.33583006947025357, + "step": 47840 + }, + { + "epoch": 7.08, + "learning_rate": 6.485163204747775e-06, + "loss": 0.9741, + "step": 47880 + }, + { + "epoch": 7.08, + "eval_loss": 0.9108271598815918, + "eval_runtime": 518.103, + "eval_samples_per_second": 14.744, + "eval_wer": 0.33488664627347836, + "step": 47880 + }, + { + "epoch": 7.08, + "learning_rate": 6.48219584569733e-06, + "loss": 1.0534, + "step": 47920 + }, + { + "epoch": 7.08, + "eval_loss": 0.8777278065681458, + "eval_runtime": 516.8775, + "eval_samples_per_second": 14.779, + "eval_wer": 0.33317133137025073, + "step": 47920 + }, + { + "epoch": 7.09, + "learning_rate": 6.479228486646885e-06, + "loss": 1.0529, + "step": 47960 + }, + { + "epoch": 7.09, + "eval_loss": 0.9484491944313049, + "eval_runtime": 517.9353, + "eval_samples_per_second": 14.749, + "eval_wer": 0.3375739729552017, + "step": 47960 + }, + { + "epoch": 7.1, + "learning_rate": 6.476261127596439e-06, + "loss": 1.0025, + "step": 48000 + }, + { + "epoch": 7.1, + "eval_loss": 0.9103545546531677, + "eval_runtime": 518.4957, + "eval_samples_per_second": 14.733, + "eval_wer": 0.33497241201863975, + "step": 48000 + }, + { + "epoch": 7.1, + "learning_rate": 6.4732937685459955e-06, + "loss": 1.0184, + "step": 48040 + }, + { + "epoch": 7.1, + "eval_loss": 0.949988842010498, + "eval_runtime": 518.7937, + "eval_samples_per_second": 14.725, + "eval_wer": 0.3372594985562766, + "step": 48040 + }, + { + "epoch": 7.11, + "learning_rate": 6.47032640949555e-06, + "loss": 1.0725, + "step": 48080 + }, + { + "epoch": 7.11, + "eval_loss": 0.9352774620056152, + "eval_runtime": 522.2188, + "eval_samples_per_second": 14.628, + "eval_wer": 0.33617313245089914, + "step": 48080 + }, + { + "epoch": 7.11, + "learning_rate": 6.467359050445104e-06, + "loss": 1.0112, + "step": 48120 + }, + { + "epoch": 7.11, + "eval_loss": 0.9344502687454224, + "eval_runtime": 518.6874, + "eval_samples_per_second": 14.728, + "eval_wer": 0.33623030961434003, + "step": 48120 + }, + { + "epoch": 7.12, + "learning_rate": 6.464391691394659e-06, + "loss": 1.1463, + "step": 48160 + }, + { + "epoch": 7.12, + "eval_loss": 0.9344373345375061, + "eval_runtime": 517.6771, + "eval_samples_per_second": 14.756, + "eval_wer": 0.33708796706595384, + "step": 48160 + }, + { + "epoch": 7.12, + "learning_rate": 6.461424332344214e-06, + "loss": 1.0512, + "step": 48200 + }, + { + "epoch": 7.12, + "eval_loss": 0.9003881812095642, + "eval_runtime": 519.1711, + "eval_samples_per_second": 14.714, + "eval_wer": 0.3344864061293919, + "step": 48200 + }, + { + "epoch": 7.13, + "learning_rate": 6.4584569732937686e-06, + "loss": 1.0625, + "step": 48240 + }, + { + "epoch": 7.13, + "eval_loss": 0.934649646282196, + "eval_runtime": 518.3189, + "eval_samples_per_second": 14.738, + "eval_wer": 0.33760256153692214, + "step": 48240 + }, + { + "epoch": 7.14, + "learning_rate": 6.455489614243325e-06, + "loss": 0.9722, + "step": 48280 + }, + { + "epoch": 7.14, + "eval_loss": 0.9528153538703918, + "eval_runtime": 517.641, + "eval_samples_per_second": 14.757, + "eval_wer": 0.33871751622402013, + "step": 48280 + }, + { + "epoch": 7.14, + "learning_rate": 6.452522255192879e-06, + "loss": 0.9606, + "step": 48320 + }, + { + "epoch": 7.14, + "eval_loss": 0.9660664200782776, + "eval_runtime": 522.0228, + "eval_samples_per_second": 14.633, + "eval_wer": 0.33974670516595673, + "step": 48320 + }, + { + "epoch": 7.15, + "learning_rate": 6.449554896142434e-06, + "loss": 1.0266, + "step": 48360 + }, + { + "epoch": 7.15, + "eval_loss": 0.9631533622741699, + "eval_runtime": 519.5817, + "eval_samples_per_second": 14.702, + "eval_wer": 0.3386603390605792, + "step": 48360 + }, + { + "epoch": 7.15, + "learning_rate": 6.446587537091988e-06, + "loss": 1.0468, + "step": 48400 + }, + { + "epoch": 7.15, + "eval_loss": 0.9267898797988892, + "eval_runtime": 518.959, + "eval_samples_per_second": 14.72, + "eval_wer": 0.33737385288315846, + "step": 48400 + }, + { + "epoch": 7.16, + "learning_rate": 6.443620178041543e-06, + "loss": 1.1139, + "step": 48440 + }, + { + "epoch": 7.16, + "eval_loss": 0.9207188487052917, + "eval_runtime": 518.8029, + "eval_samples_per_second": 14.724, + "eval_wer": 0.33708796706595384, + "step": 48440 + }, + { + "epoch": 7.17, + "learning_rate": 6.440652818991099e-06, + "loss": 0.9846, + "step": 48480 + }, + { + "epoch": 7.17, + "eval_loss": 0.9798438549041748, + "eval_runtime": 520.2663, + "eval_samples_per_second": 14.683, + "eval_wer": 0.34140484290574347, + "step": 48480 + }, + { + "epoch": 7.17, + "learning_rate": 6.437685459940654e-06, + "loss": 1.0204, + "step": 48520 + }, + { + "epoch": 7.17, + "eval_loss": 0.9092714190483093, + "eval_runtime": 518.571, + "eval_samples_per_second": 14.731, + "eval_wer": 0.33591583521541496, + "step": 48520 + }, + { + "epoch": 7.18, + "learning_rate": 6.434718100890208e-06, + "loss": 0.9503, + "step": 48560 + }, + { + "epoch": 7.18, + "eval_loss": 0.9233335852622986, + "eval_runtime": 517.6466, + "eval_samples_per_second": 14.757, + "eval_wer": 0.33708796706595384, + "step": 48560 + }, + { + "epoch": 7.18, + "learning_rate": 6.431750741839763e-06, + "loss": 0.9755, + "step": 48600 + }, + { + "epoch": 7.18, + "eval_loss": 0.9563552141189575, + "eval_runtime": 519.146, + "eval_samples_per_second": 14.715, + "eval_wer": 0.3386031618971383, + "step": 48600 + }, + { + "epoch": 7.19, + "learning_rate": 6.428783382789317e-06, + "loss": 1.0387, + "step": 48640 + }, + { + "epoch": 7.19, + "eval_loss": 0.9228087067604065, + "eval_runtime": 519.6073, + "eval_samples_per_second": 14.701, + "eval_wer": 0.3365447840132651, + "step": 48640 + }, + { + "epoch": 7.2, + "learning_rate": 6.425816023738873e-06, + "loss": 0.98, + "step": 48680 + }, + { + "epoch": 7.2, + "eval_loss": 0.9403106570243835, + "eval_runtime": 518.3568, + "eval_samples_per_second": 14.737, + "eval_wer": 0.3375739729552017, + "step": 48680 + }, + { + "epoch": 7.2, + "learning_rate": 6.422848664688428e-06, + "loss": 1.0236, + "step": 48720 + }, + { + "epoch": 7.2, + "eval_loss": 0.9320812225341797, + "eval_runtime": 519.1441, + "eval_samples_per_second": 14.715, + "eval_wer": 0.33643042968638326, + "step": 48720 + }, + { + "epoch": 7.21, + "learning_rate": 6.419881305637983e-06, + "loss": 1.0239, + "step": 48760 + }, + { + "epoch": 7.21, + "eval_loss": 0.9221595525741577, + "eval_runtime": 521.6914, + "eval_samples_per_second": 14.643, + "eval_wer": 0.3358014808885331, + "step": 48760 + }, + { + "epoch": 7.21, + "learning_rate": 6.4169139465875375e-06, + "loss": 0.9724, + "step": 48800 + }, + { + "epoch": 7.21, + "eval_loss": 0.9507524371147156, + "eval_runtime": 519.0042, + "eval_samples_per_second": 14.719, + "eval_wer": 0.3386031618971383, + "step": 48800 + }, + { + "epoch": 7.22, + "learning_rate": 6.413946587537092e-06, + "loss": 0.9809, + "step": 48840 + }, + { + "epoch": 7.22, + "eval_loss": 0.9051950573921204, + "eval_runtime": 518.8328, + "eval_samples_per_second": 14.723, + "eval_wer": 0.3337145144229395, + "step": 48840 + }, + { + "epoch": 7.23, + "learning_rate": 6.410979228486648e-06, + "loss": 1.0199, + "step": 48880 + }, + { + "epoch": 7.23, + "eval_loss": 1.002166509628296, + "eval_runtime": 519.9952, + "eval_samples_per_second": 14.691, + "eval_wer": 0.341747905886389, + "step": 48880 + }, + { + "epoch": 7.23, + "learning_rate": 6.4080118694362025e-06, + "loss": 1.0249, + "step": 48920 + }, + { + "epoch": 7.23, + "eval_loss": 0.9676195979118347, + "eval_runtime": 517.6174, + "eval_samples_per_second": 14.758, + "eval_wer": 0.339889648074559, + "step": 48920 + }, + { + "epoch": 7.24, + "learning_rate": 6.405044510385757e-06, + "loss": 1.0639, + "step": 48960 + }, + { + "epoch": 7.24, + "eval_loss": 0.9231087565422058, + "eval_runtime": 518.8067, + "eval_samples_per_second": 14.724, + "eval_wer": 0.33608736670573774, + "step": 48960 + }, + { + "epoch": 7.24, + "learning_rate": 6.402077151335312e-06, + "loss": 1.1407, + "step": 49000 + }, + { + "epoch": 7.24, + "eval_loss": 0.9747340083122253, + "eval_runtime": 518.374, + "eval_samples_per_second": 14.736, + "eval_wer": 0.3400325909831613, + "step": 49000 + }, + { + "epoch": 7.25, + "learning_rate": 6.399109792284867e-06, + "loss": 0.9436, + "step": 49040 + }, + { + "epoch": 7.25, + "eval_loss": 0.9569833278656006, + "eval_runtime": 518.9994, + "eval_samples_per_second": 14.719, + "eval_wer": 0.3388890477143429, + "step": 49040 + }, + { + "epoch": 7.25, + "learning_rate": 6.396142433234422e-06, + "loss": 0.9907, + "step": 49080 + }, + { + "epoch": 7.25, + "eval_loss": 0.9232583045959473, + "eval_runtime": 518.5449, + "eval_samples_per_second": 14.732, + "eval_wer": 0.33488664627347836, + "step": 49080 + }, + { + "epoch": 7.26, + "learning_rate": 6.393175074183977e-06, + "loss": 1.0221, + "step": 49120 + }, + { + "epoch": 7.26, + "eval_loss": 0.9653372168540955, + "eval_runtime": 518.189, + "eval_samples_per_second": 14.742, + "eval_wer": 0.3383458646616541, + "step": 49120 + }, + { + "epoch": 7.27, + "learning_rate": 6.390207715133532e-06, + "loss": 1.0051, + "step": 49160 + }, + { + "epoch": 7.27, + "eval_loss": 0.9079302549362183, + "eval_runtime": 521.4996, + "eval_samples_per_second": 14.648, + "eval_wer": 0.33505817776380115, + "step": 49160 + }, + { + "epoch": 7.27, + "learning_rate": 6.387240356083086e-06, + "loss": 0.9932, + "step": 49200 + }, + { + "epoch": 7.27, + "eval_loss": 0.9315870404243469, + "eval_runtime": 519.0884, + "eval_samples_per_second": 14.716, + "eval_wer": 0.3364590182681037, + "step": 49200 + }, + { + "epoch": 7.28, + "learning_rate": 6.3842729970326415e-06, + "loss": 0.9634, + "step": 49240 + }, + { + "epoch": 7.28, + "eval_loss": 0.9709529280662537, + "eval_runtime": 518.8431, + "eval_samples_per_second": 14.723, + "eval_wer": 0.3394608193487521, + "step": 49240 + }, + { + "epoch": 7.28, + "learning_rate": 6.381305637982196e-06, + "loss": 1.0648, + "step": 49280 + }, + { + "epoch": 7.28, + "eval_loss": 0.9377908110618591, + "eval_runtime": 520.0025, + "eval_samples_per_second": 14.69, + "eval_wer": 0.3372023213928357, + "step": 49280 + }, + { + "epoch": 7.29, + "learning_rate": 6.378338278931751e-06, + "loss": 1.0007, + "step": 49320 + }, + { + "epoch": 7.29, + "eval_loss": 0.9122663736343384, + "eval_runtime": 519.231, + "eval_samples_per_second": 14.712, + "eval_wer": 0.3354584179078876, + "step": 49320 + }, + { + "epoch": 7.3, + "learning_rate": 6.3753709198813065e-06, + "loss": 0.9773, + "step": 49360 + }, + { + "epoch": 7.3, + "eval_loss": 0.9604159593582153, + "eval_runtime": 519.1171, + "eval_samples_per_second": 14.715, + "eval_wer": 0.3388604591326224, + "step": 49360 + }, + { + "epoch": 7.3, + "learning_rate": 6.372403560830861e-06, + "loss": 1.0463, + "step": 49400 + }, + { + "epoch": 7.3, + "eval_loss": 0.9135463237762451, + "eval_runtime": 524.0276, + "eval_samples_per_second": 14.577, + "eval_wer": 0.33557277223476945, + "step": 49400 + }, + { + "epoch": 7.31, + "learning_rate": 6.369436201780415e-06, + "loss": 1.0393, + "step": 49440 + }, + { + "epoch": 7.31, + "eval_loss": 0.9357494115829468, + "eval_runtime": 518.4021, + "eval_samples_per_second": 14.736, + "eval_wer": 0.33623030961434003, + "step": 49440 + }, + { + "epoch": 7.31, + "learning_rate": 6.366468842729971e-06, + "loss": 0.976, + "step": 49480 + }, + { + "epoch": 7.31, + "eval_loss": 0.9702383279800415, + "eval_runtime": 522.5395, + "eval_samples_per_second": 14.619, + "eval_wer": 0.3392606992767089, + "step": 49480 + }, + { + "epoch": 7.32, + "learning_rate": 6.363501483679526e-06, + "loss": 0.9735, + "step": 49520 + }, + { + "epoch": 7.32, + "eval_loss": 0.9268819689750671, + "eval_runtime": 524.6711, + "eval_samples_per_second": 14.56, + "eval_wer": 0.33520112067240343, + "step": 49520 + }, + { + "epoch": 7.33, + "learning_rate": 6.360534124629081e-06, + "loss": 0.9757, + "step": 49560 + }, + { + "epoch": 7.33, + "eval_loss": 0.9248133897781372, + "eval_runtime": 518.8479, + "eval_samples_per_second": 14.723, + "eval_wer": 0.33557277223476945, + "step": 49560 + }, + { + "epoch": 7.33, + "learning_rate": 6.357566765578636e-06, + "loss": 0.9881, + "step": 49600 + }, + { + "epoch": 7.33, + "eval_loss": 0.9447203278541565, + "eval_runtime": 518.821, + "eval_samples_per_second": 14.724, + "eval_wer": 0.3372309099745562, + "step": 49600 + }, + { + "epoch": 7.34, + "learning_rate": 6.35459940652819e-06, + "loss": 1.0503, + "step": 49640 + }, + { + "epoch": 7.34, + "eval_loss": 0.9256668090820312, + "eval_runtime": 519.8788, + "eval_samples_per_second": 14.694, + "eval_wer": 0.336287486777781, + "step": 49640 + }, + { + "epoch": 7.34, + "learning_rate": 6.3516320474777446e-06, + "loss": 1.0098, + "step": 49680 + }, + { + "epoch": 7.34, + "eval_loss": 0.9638358950614929, + "eval_runtime": 519.3222, + "eval_samples_per_second": 14.71, + "eval_wer": 0.33871751622402013, + "step": 49680 + }, + { + "epoch": 7.35, + "learning_rate": 6.348664688427301e-06, + "loss": 1.0504, + "step": 49720 + }, + { + "epoch": 7.35, + "eval_loss": 0.884833037853241, + "eval_runtime": 519.6024, + "eval_samples_per_second": 14.702, + "eval_wer": 0.3327139140627233, + "step": 49720 + }, + { + "epoch": 7.36, + "learning_rate": 6.345697329376855e-06, + "loss": 1.0005, + "step": 49760 + }, + { + "epoch": 7.36, + "eval_loss": 0.9212217926979065, + "eval_runtime": 521.2208, + "eval_samples_per_second": 14.656, + "eval_wer": 0.33520112067240343, + "step": 49760 + }, + { + "epoch": 7.36, + "learning_rate": 6.3427299703264104e-06, + "loss": 0.9379, + "step": 49800 + }, + { + "epoch": 7.36, + "eval_loss": 0.9602131247520447, + "eval_runtime": 519.6828, + "eval_samples_per_second": 14.699, + "eval_wer": 0.3386031618971383, + "step": 49800 + }, + { + "epoch": 7.37, + "learning_rate": 6.339762611275965e-06, + "loss": 0.9778, + "step": 49840 + }, + { + "epoch": 7.37, + "eval_loss": 0.9330121874809265, + "eval_runtime": 519.038, + "eval_samples_per_second": 14.718, + "eval_wer": 0.33548700648960805, + "step": 49840 + }, + { + "epoch": 7.37, + "learning_rate": 6.336795252225519e-06, + "loss": 1.0321, + "step": 49880 + }, + { + "epoch": 7.37, + "eval_loss": 0.9249868988990784, + "eval_runtime": 518.6502, + "eval_samples_per_second": 14.729, + "eval_wer": 0.3353726521627262, + "step": 49880 + }, + { + "epoch": 7.38, + "learning_rate": 6.3338278931750755e-06, + "loss": 1.046, + "step": 49920 + }, + { + "epoch": 7.38, + "eval_loss": 0.9259698987007141, + "eval_runtime": 520.9618, + "eval_samples_per_second": 14.663, + "eval_wer": 0.33565853797993084, + "step": 49920 + }, + { + "epoch": 7.39, + "learning_rate": 6.33086053412463e-06, + "loss": 1.0411, + "step": 49960 + }, + { + "epoch": 7.39, + "eval_loss": 0.9152907729148865, + "eval_runtime": 519.674, + "eval_samples_per_second": 14.7, + "eval_wer": 0.33440064038423056, + "step": 49960 + }, + { + "epoch": 7.39, + "learning_rate": 6.327893175074184e-06, + "loss": 1.0291, + "step": 50000 + }, + { + "epoch": 7.39, + "eval_loss": 0.9502978920936584, + "eval_runtime": 520.9246, + "eval_samples_per_second": 14.664, + "eval_wer": 0.3368306698304697, + "step": 50000 + }, + { + "epoch": 7.4, + "learning_rate": 6.32492581602374e-06, + "loss": 1.0376, + "step": 50040 + }, + { + "epoch": 7.4, + "eval_loss": 0.9250549674034119, + "eval_runtime": 520.1746, + "eval_samples_per_second": 14.685, + "eval_wer": 0.3360301895422968, + "step": 50040 + }, + { + "epoch": 7.4, + "learning_rate": 6.321958456973294e-06, + "loss": 0.981, + "step": 50080 + }, + { + "epoch": 7.4, + "eval_loss": 0.9222678542137146, + "eval_runtime": 520.5542, + "eval_samples_per_second": 14.675, + "eval_wer": 0.33505817776380115, + "step": 50080 + }, + { + "epoch": 7.41, + "learning_rate": 6.318991097922849e-06, + "loss": 0.9927, + "step": 50120 + }, + { + "epoch": 7.41, + "eval_loss": 0.9609561562538147, + "eval_runtime": 520.5149, + "eval_samples_per_second": 14.676, + "eval_wer": 0.3372023213928357, + "step": 50120 + }, + { + "epoch": 7.41, + "learning_rate": 6.316023738872405e-06, + "loss": 1.063, + "step": 50160 + }, + { + "epoch": 7.41, + "eval_loss": 0.968572199344635, + "eval_runtime": 519.5879, + "eval_samples_per_second": 14.702, + "eval_wer": 0.33797421309928816, + "step": 50160 + }, + { + "epoch": 7.42, + "learning_rate": 6.313056379821959e-06, + "loss": 1.0368, + "step": 50200 + }, + { + "epoch": 7.42, + "eval_loss": 0.9010893702507019, + "eval_runtime": 519.4537, + "eval_samples_per_second": 14.706, + "eval_wer": 0.3337716915863804, + "step": 50200 + }, + { + "epoch": 7.43, + "learning_rate": 6.3100890207715135e-06, + "loss": 0.9354, + "step": 50240 + }, + { + "epoch": 7.43, + "eval_loss": 0.9421952366828918, + "eval_runtime": 519.7807, + "eval_samples_per_second": 14.697, + "eval_wer": 0.3362588981960605, + "step": 50240 + }, + { + "epoch": 7.43, + "learning_rate": 6.307121661721069e-06, + "loss": 1.0611, + "step": 50280 + }, + { + "epoch": 7.43, + "eval_loss": 0.8898743391036987, + "eval_runtime": 519.0623, + "eval_samples_per_second": 14.717, + "eval_wer": 0.3331999199519712, + "step": 50280 + }, + { + "epoch": 7.44, + "learning_rate": 6.304154302670623e-06, + "loss": 0.9981, + "step": 50320 + }, + { + "epoch": 7.44, + "eval_loss": 0.9190933704376221, + "eval_runtime": 517.4504, + "eval_samples_per_second": 14.763, + "eval_wer": 0.33482946911003747, + "step": 50320 + }, + { + "epoch": 7.44, + "learning_rate": 6.3011869436201786e-06, + "loss": 0.9795, + "step": 50360 + }, + { + "epoch": 7.44, + "eval_loss": 0.932735025882721, + "eval_runtime": 518.8218, + "eval_samples_per_second": 14.724, + "eval_wer": 0.3358872466336945, + "step": 50360 + }, + { + "epoch": 7.45, + "learning_rate": 6.298219584569734e-06, + "loss": 1.016, + "step": 50400 + }, + { + "epoch": 7.45, + "eval_loss": 0.9249831438064575, + "eval_runtime": 520.4809, + "eval_samples_per_second": 14.677, + "eval_wer": 0.3362588981960605, + "step": 50400 + }, + { + "epoch": 7.46, + "learning_rate": 6.295252225519288e-06, + "loss": 0.9185, + "step": 50440 + }, + { + "epoch": 7.46, + "eval_loss": 0.9831563234329224, + "eval_runtime": 518.8307, + "eval_samples_per_second": 14.723, + "eval_wer": 0.3399754138197204, + "step": 50440 + }, + { + "epoch": 7.46, + "learning_rate": 6.292284866468843e-06, + "loss": 1.0498, + "step": 50480 + }, + { + "epoch": 7.46, + "eval_loss": 0.921595573425293, + "eval_runtime": 518.7714, + "eval_samples_per_second": 14.725, + "eval_wer": 0.33520112067240343, + "step": 50480 + }, + { + "epoch": 7.47, + "learning_rate": 6.289317507418398e-06, + "loss": 1.0443, + "step": 50520 + }, + { + "epoch": 7.47, + "eval_loss": 0.9293116331100464, + "eval_runtime": 519.3691, + "eval_samples_per_second": 14.708, + "eval_wer": 0.3352297092541239, + "step": 50520 + }, + { + "epoch": 7.47, + "learning_rate": 6.286350148367953e-06, + "loss": 0.978, + "step": 50560 + }, + { + "epoch": 7.47, + "eval_loss": 0.9404312372207642, + "eval_runtime": 519.2506, + "eval_samples_per_second": 14.712, + "eval_wer": 0.33583006947025357, + "step": 50560 + }, + { + "epoch": 7.48, + "learning_rate": 6.283382789317508e-06, + "loss": 1.0217, + "step": 50600 + }, + { + "epoch": 7.48, + "eval_loss": 0.9481327533721924, + "eval_runtime": 519.1078, + "eval_samples_per_second": 14.716, + "eval_wer": 0.33608736670573774, + "step": 50600 + }, + { + "epoch": 7.49, + "learning_rate": 6.280415430267063e-06, + "loss": 0.9993, + "step": 50640 + }, + { + "epoch": 7.49, + "eval_loss": 0.9372439384460449, + "eval_runtime": 519.3141, + "eval_samples_per_second": 14.71, + "eval_wer": 0.335544183653049, + "step": 50640 + }, + { + "epoch": 7.49, + "learning_rate": 6.2774480712166175e-06, + "loss": 1.0309, + "step": 50680 + }, + { + "epoch": 7.49, + "eval_loss": 0.9557296633720398, + "eval_runtime": 519.4073, + "eval_samples_per_second": 14.707, + "eval_wer": 0.33751679579176075, + "step": 50680 + }, + { + "epoch": 7.5, + "learning_rate": 6.274480712166172e-06, + "loss": 1.0643, + "step": 50720 + }, + { + "epoch": 7.5, + "eval_loss": 0.9240292906761169, + "eval_runtime": 519.3164, + "eval_samples_per_second": 14.71, + "eval_wer": 0.33497241201863975, + "step": 50720 + }, + { + "epoch": 7.5, + "learning_rate": 6.271513353115728e-06, + "loss": 1.0119, + "step": 50760 + }, + { + "epoch": 7.5, + "eval_loss": 0.9881883859634399, + "eval_runtime": 518.195, + "eval_samples_per_second": 14.742, + "eval_wer": 0.33974670516595673, + "step": 50760 + }, + { + "epoch": 7.51, + "learning_rate": 6.2685459940652825e-06, + "loss": 1.0225, + "step": 50800 + }, + { + "epoch": 7.51, + "eval_loss": 0.9036035537719727, + "eval_runtime": 519.0202, + "eval_samples_per_second": 14.718, + "eval_wer": 0.33345721718745536, + "step": 50800 + }, + { + "epoch": 7.52, + "learning_rate": 6.265578635014837e-06, + "loss": 0.9776, + "step": 50840 + }, + { + "epoch": 7.52, + "eval_loss": 0.9353271126747131, + "eval_runtime": 520.0686, + "eval_samples_per_second": 14.688, + "eval_wer": 0.33608736670573774, + "step": 50840 + }, + { + "epoch": 7.52, + "learning_rate": 6.262611275964392e-06, + "loss": 1.0412, + "step": 50880 + }, + { + "epoch": 7.52, + "eval_loss": 0.9424023628234863, + "eval_runtime": 519.7855, + "eval_samples_per_second": 14.696, + "eval_wer": 0.3362017210326196, + "step": 50880 + }, + { + "epoch": 7.53, + "learning_rate": 6.259643916913947e-06, + "loss": 1.0487, + "step": 50920 + }, + { + "epoch": 7.53, + "eval_loss": 0.9515993595123291, + "eval_runtime": 519.3584, + "eval_samples_per_second": 14.709, + "eval_wer": 0.3378312701906858, + "step": 50920 + }, + { + "epoch": 7.53, + "learning_rate": 6.256676557863503e-06, + "loss": 0.9842, + "step": 50960 + }, + { + "epoch": 7.53, + "eval_loss": 0.9900578260421753, + "eval_runtime": 523.7661, + "eval_samples_per_second": 14.585, + "eval_wer": 0.33934646502187027, + "step": 50960 + }, + { + "epoch": 7.54, + "learning_rate": 6.253709198813057e-06, + "loss": 1.1195, + "step": 51000 + }, + { + "epoch": 7.54, + "eval_loss": 0.9938927292823792, + "eval_runtime": 520.0585, + "eval_samples_per_second": 14.689, + "eval_wer": 0.3390319906229452, + "step": 51000 + }, + { + "epoch": 7.54, + "learning_rate": 6.250741839762612e-06, + "loss": 0.9863, + "step": 51040 + }, + { + "epoch": 7.54, + "eval_loss": 0.9372184872627258, + "eval_runtime": 519.1616, + "eval_samples_per_second": 14.714, + "eval_wer": 0.3356013608164899, + "step": 51040 + }, + { + "epoch": 7.55, + "learning_rate": 6.247774480712166e-06, + "loss": 1.0444, + "step": 51080 + }, + { + "epoch": 7.55, + "eval_loss": 0.9623214602470398, + "eval_runtime": 518.005, + "eval_samples_per_second": 14.747, + "eval_wer": 0.3372880871379971, + "step": 51080 + }, + { + "epoch": 7.56, + "learning_rate": 6.244807121661721e-06, + "loss": 1.106, + "step": 51120 + }, + { + "epoch": 7.56, + "eval_loss": 0.8742450475692749, + "eval_runtime": 520.0657, + "eval_samples_per_second": 14.689, + "eval_wer": 0.33105577632293665, + "step": 51120 + }, + { + "epoch": 7.56, + "learning_rate": 6.241839762611277e-06, + "loss": 1.1903, + "step": 51160 + }, + { + "epoch": 7.56, + "eval_loss": 0.8926132321357727, + "eval_runtime": 520.6411, + "eval_samples_per_second": 14.672, + "eval_wer": 0.3316561365390663, + "step": 51160 + }, + { + "epoch": 7.57, + "learning_rate": 6.238872403560832e-06, + "loss": 1.0077, + "step": 51200 + }, + { + "epoch": 7.57, + "eval_loss": 0.9220393896102905, + "eval_runtime": 519.6512, + "eval_samples_per_second": 14.7, + "eval_wer": 0.3342576974756282, + "step": 51200 + }, + { + "epoch": 7.57, + "learning_rate": 6.2359050445103864e-06, + "loss": 1.0206, + "step": 51240 + }, + { + "epoch": 7.57, + "eval_loss": 0.9552518129348755, + "eval_runtime": 519.378, + "eval_samples_per_second": 14.708, + "eval_wer": 0.3356013608164899, + "step": 51240 + }, + { + "epoch": 7.58, + "learning_rate": 6.232937685459941e-06, + "loss": 1.0389, + "step": 51280 + }, + { + "epoch": 7.58, + "eval_loss": 0.8979615569114685, + "eval_runtime": 518.4658, + "eval_samples_per_second": 14.734, + "eval_wer": 0.33145601646702305, + "step": 51280 + }, + { + "epoch": 7.59, + "learning_rate": 6.229970326409495e-06, + "loss": 0.9826, + "step": 51320 + }, + { + "epoch": 7.59, + "eval_loss": 0.9164960384368896, + "eval_runtime": 519.5823, + "eval_samples_per_second": 14.702, + "eval_wer": 0.3330569770433689, + "step": 51320 + }, + { + "epoch": 7.59, + "learning_rate": 6.227002967359051e-06, + "loss": 1.0587, + "step": 51360 + }, + { + "epoch": 7.59, + "eval_loss": 0.9240958094596863, + "eval_runtime": 518.4809, + "eval_samples_per_second": 14.733, + "eval_wer": 0.33388604591326226, + "step": 51360 + }, + { + "epoch": 7.6, + "learning_rate": 6.224035608308606e-06, + "loss": 1.0244, + "step": 51400 + }, + { + "epoch": 7.6, + "eval_loss": 0.9180992841720581, + "eval_runtime": 520.7726, + "eval_samples_per_second": 14.669, + "eval_wer": 0.33337145144229396, + "step": 51400 + }, + { + "epoch": 7.6, + "learning_rate": 6.221068249258161e-06, + "loss": 0.9448, + "step": 51440 + }, + { + "epoch": 7.6, + "eval_loss": 0.9629867672920227, + "eval_runtime": 518.5766, + "eval_samples_per_second": 14.731, + "eval_wer": 0.336973612739072, + "step": 51440 + }, + { + "epoch": 7.61, + "learning_rate": 6.218100890207716e-06, + "loss": 0.9706, + "step": 51480 + }, + { + "epoch": 7.61, + "eval_loss": 0.9382863640785217, + "eval_runtime": 522.4388, + "eval_samples_per_second": 14.622, + "eval_wer": 0.33557277223476945, + "step": 51480 + }, + { + "epoch": 7.62, + "learning_rate": 6.21513353115727e-06, + "loss": 1.0039, + "step": 51520 + }, + { + "epoch": 7.62, + "eval_loss": 0.9513601660728455, + "eval_runtime": 520.5687, + "eval_samples_per_second": 14.674, + "eval_wer": 0.3367163155035879, + "step": 51520 + }, + { + "epoch": 7.62, + "learning_rate": 6.2121661721068245e-06, + "loss": 0.9788, + "step": 51560 + }, + { + "epoch": 7.62, + "eval_loss": 0.8911813497543335, + "eval_runtime": 520.5457, + "eval_samples_per_second": 14.675, + "eval_wer": 0.33154178221218444, + "step": 51560 + }, + { + "epoch": 7.63, + "learning_rate": 6.209198813056381e-06, + "loss": 1.0207, + "step": 51600 + }, + { + "epoch": 7.63, + "eval_loss": 0.9084755778312683, + "eval_runtime": 519.3292, + "eval_samples_per_second": 14.709, + "eval_wer": 0.3332570971154121, + "step": 51600 + }, + { + "epoch": 7.63, + "learning_rate": 6.206231454005935e-06, + "loss": 0.9943, + "step": 51640 + }, + { + "epoch": 7.63, + "eval_loss": 0.9123982787132263, + "eval_runtime": 518.6245, + "eval_samples_per_second": 14.729, + "eval_wer": 0.3332570971154121, + "step": 51640 + }, + { + "epoch": 7.64, + "learning_rate": 6.20326409495549e-06, + "loss": 1.0024, + "step": 51680 + }, + { + "epoch": 7.64, + "eval_loss": 0.9628497958183289, + "eval_runtime": 519.5674, + "eval_samples_per_second": 14.703, + "eval_wer": 0.3372594985562766, + "step": 51680 + }, + { + "epoch": 7.65, + "learning_rate": 6.200296735905045e-06, + "loss": 1.0777, + "step": 51720 + }, + { + "epoch": 7.65, + "eval_loss": 0.9197179079055786, + "eval_runtime": 524.522, + "eval_samples_per_second": 14.564, + "eval_wer": 0.3335715715143372, + "step": 51720 + }, + { + "epoch": 7.65, + "learning_rate": 6.197329376854599e-06, + "loss": 1.0669, + "step": 51760 + }, + { + "epoch": 7.65, + "eval_loss": 0.9119200706481934, + "eval_runtime": 520.4251, + "eval_samples_per_second": 14.678, + "eval_wer": 0.3332570971154121, + "step": 51760 + }, + { + "epoch": 7.66, + "learning_rate": 6.194362017804155e-06, + "loss": 0.9776, + "step": 51800 + }, + { + "epoch": 7.66, + "eval_loss": 0.948456883430481, + "eval_runtime": 519.1741, + "eval_samples_per_second": 14.714, + "eval_wer": 0.33651619543154465, + "step": 51800 + }, + { + "epoch": 7.66, + "learning_rate": 6.19139465875371e-06, + "loss": 1.1093, + "step": 51840 + }, + { + "epoch": 7.66, + "eval_loss": 0.9134979844093323, + "eval_runtime": 519.7495, + "eval_samples_per_second": 14.697, + "eval_wer": 0.33437205180251006, + "step": 51840 + }, + { + "epoch": 7.67, + "learning_rate": 6.188427299703264e-06, + "loss": 1.0656, + "step": 51880 + }, + { + "epoch": 7.67, + "eval_loss": 0.9108756184577942, + "eval_runtime": 520.9303, + "eval_samples_per_second": 14.664, + "eval_wer": 0.33437205180251006, + "step": 51880 + }, + { + "epoch": 7.67, + "learning_rate": 6.18545994065282e-06, + "loss": 0.969, + "step": 51920 + }, + { + "epoch": 7.67, + "eval_loss": 0.9390916228294373, + "eval_runtime": 519.0593, + "eval_samples_per_second": 14.717, + "eval_wer": 0.33605877812401724, + "step": 51920 + }, + { + "epoch": 7.68, + "learning_rate": 6.182492581602374e-06, + "loss": 0.9473, + "step": 51960 + }, + { + "epoch": 7.68, + "eval_loss": 0.9396269917488098, + "eval_runtime": 521.7036, + "eval_samples_per_second": 14.642, + "eval_wer": 0.33557277223476945, + "step": 51960 + }, + { + "epoch": 7.69, + "learning_rate": 6.17952522255193e-06, + "loss": 1.1213, + "step": 52000 + }, + { + "epoch": 7.69, + "eval_loss": 0.942671000957489, + "eval_runtime": 519.1157, + "eval_samples_per_second": 14.715, + "eval_wer": 0.33608736670573774, + "step": 52000 + }, + { + "epoch": 7.69, + "learning_rate": 6.176557863501485e-06, + "loss": 0.9753, + "step": 52040 + }, + { + "epoch": 7.69, + "eval_loss": 0.9247638583183289, + "eval_runtime": 519.1388, + "eval_samples_per_second": 14.715, + "eval_wer": 0.3347437033648761, + "step": 52040 + }, + { + "epoch": 7.7, + "learning_rate": 6.173590504451039e-06, + "loss": 0.9582, + "step": 52080 + }, + { + "epoch": 7.7, + "eval_loss": 0.9556808471679688, + "eval_runtime": 518.4477, + "eval_samples_per_second": 14.734, + "eval_wer": 0.3363160753595014, + "step": 52080 + }, + { + "epoch": 7.7, + "learning_rate": 6.1706231454005935e-06, + "loss": 1.0331, + "step": 52120 + }, + { + "epoch": 7.7, + "eval_loss": 0.8891159892082214, + "eval_runtime": 520.8416, + "eval_samples_per_second": 14.667, + "eval_wer": 0.3317990794476686, + "step": 52120 + }, + { + "epoch": 7.71, + "learning_rate": 6.167655786350149e-06, + "loss": 1.0504, + "step": 52160 + }, + { + "epoch": 7.71, + "eval_loss": 0.9058249592781067, + "eval_runtime": 520.0726, + "eval_samples_per_second": 14.688, + "eval_wer": 0.33299979987992795, + "step": 52160 + }, + { + "epoch": 7.72, + "learning_rate": 6.164688427299704e-06, + "loss": 1.0137, + "step": 52200 + }, + { + "epoch": 7.72, + "eval_loss": 0.8907362222671509, + "eval_runtime": 519.1144, + "eval_samples_per_second": 14.715, + "eval_wer": 0.3326853254810029, + "step": 52200 + }, + { + "epoch": 7.72, + "learning_rate": 6.161721068249259e-06, + "loss": 1.0241, + "step": 52240 + }, + { + "epoch": 7.72, + "eval_loss": 0.9164539575576782, + "eval_runtime": 519.7665, + "eval_samples_per_second": 14.697, + "eval_wer": 0.3337431030046599, + "step": 52240 + }, + { + "epoch": 7.73, + "learning_rate": 6.158753709198814e-06, + "loss": 0.9969, + "step": 52280 + }, + { + "epoch": 7.73, + "eval_loss": 0.9141135215759277, + "eval_runtime": 518.9521, + "eval_samples_per_second": 14.72, + "eval_wer": 0.33334286286057346, + "step": 52280 + }, + { + "epoch": 7.73, + "learning_rate": 6.155786350148368e-06, + "loss": 0.9862, + "step": 52320 + }, + { + "epoch": 7.73, + "eval_loss": 0.9178887605667114, + "eval_runtime": 522.8212, + "eval_samples_per_second": 14.611, + "eval_wer": 0.3331999199519712, + "step": 52320 + }, + { + "epoch": 7.74, + "learning_rate": 6.152818991097923e-06, + "loss": 1.0149, + "step": 52360 + }, + { + "epoch": 7.74, + "eval_loss": 0.9122446179389954, + "eval_runtime": 519.4921, + "eval_samples_per_second": 14.705, + "eval_wer": 0.33294262271648706, + "step": 52360 + }, + { + "epoch": 7.75, + "learning_rate": 6.149851632047478e-06, + "loss": 1.0022, + "step": 52400 + }, + { + "epoch": 7.75, + "eval_loss": 0.8836090564727783, + "eval_runtime": 519.0164, + "eval_samples_per_second": 14.718, + "eval_wer": 0.33008376454444094, + "step": 52400 + }, + { + "epoch": 7.75, + "learning_rate": 6.146884272997033e-06, + "loss": 1.0357, + "step": 52440 + }, + { + "epoch": 7.75, + "eval_loss": 0.9362127780914307, + "eval_runtime": 519.2495, + "eval_samples_per_second": 14.712, + "eval_wer": 0.33385745733154176, + "step": 52440 + }, + { + "epoch": 7.76, + "learning_rate": 6.1439169139465885e-06, + "loss": 0.9898, + "step": 52480 + }, + { + "epoch": 7.76, + "eval_loss": 0.9178655743598938, + "eval_runtime": 520.2439, + "eval_samples_per_second": 14.683, + "eval_wer": 0.3326853254810029, + "step": 52480 + }, + { + "epoch": 7.76, + "learning_rate": 6.140949554896143e-06, + "loss": 0.958, + "step": 52520 + }, + { + "epoch": 7.76, + "eval_loss": 0.9565437436103821, + "eval_runtime": 520.471, + "eval_samples_per_second": 14.677, + "eval_wer": 0.3352868864175648, + "step": 52520 + }, + { + "epoch": 7.77, + "learning_rate": 6.1379821958456974e-06, + "loss": 0.9775, + "step": 52560 + }, + { + "epoch": 7.77, + "eval_loss": 0.9389362335205078, + "eval_runtime": 519.1362, + "eval_samples_per_second": 14.715, + "eval_wer": 0.3340861659853055, + "step": 52560 + }, + { + "epoch": 7.78, + "learning_rate": 6.135014836795252e-06, + "loss": 1.0062, + "step": 52600 + }, + { + "epoch": 7.78, + "eval_loss": 0.9822790622711182, + "eval_runtime": 520.8789, + "eval_samples_per_second": 14.666, + "eval_wer": 0.3372880871379971, + "step": 52600 + }, + { + "epoch": 7.78, + "learning_rate": 6.132047477744808e-06, + "loss": 0.9774, + "step": 52640 + }, + { + "epoch": 7.78, + "eval_loss": 0.9300295114517212, + "eval_runtime": 518.9146, + "eval_samples_per_second": 14.721, + "eval_wer": 0.3341433431487464, + "step": 52640 + }, + { + "epoch": 7.79, + "learning_rate": 6.1290801186943624e-06, + "loss": 1.0741, + "step": 52680 + }, + { + "epoch": 7.79, + "eval_loss": 0.9428894519805908, + "eval_runtime": 519.1882, + "eval_samples_per_second": 14.713, + "eval_wer": 0.33531547499928527, + "step": 52680 + }, + { + "epoch": 7.79, + "learning_rate": 6.126112759643918e-06, + "loss": 0.9765, + "step": 52720 + }, + { + "epoch": 7.79, + "eval_loss": 0.9397070407867432, + "eval_runtime": 520.4144, + "eval_samples_per_second": 14.679, + "eval_wer": 0.3349152348551988, + "step": 52720 + }, + { + "epoch": 7.8, + "learning_rate": 6.123145400593472e-06, + "loss": 0.9892, + "step": 52760 + }, + { + "epoch": 7.8, + "eval_loss": 0.9304806590080261, + "eval_runtime": 520.6411, + "eval_samples_per_second": 14.672, + "eval_wer": 0.33388604591326226, + "step": 52760 + }, + { + "epoch": 7.8, + "learning_rate": 6.120178041543027e-06, + "loss": 0.9704, + "step": 52800 + }, + { + "epoch": 7.8, + "eval_loss": 0.94686359167099, + "eval_runtime": 523.8778, + "eval_samples_per_second": 14.582, + "eval_wer": 0.3352868864175648, + "step": 52800 + }, + { + "epoch": 7.81, + "learning_rate": 6.117210682492583e-06, + "loss": 1.0201, + "step": 52840 + }, + { + "epoch": 7.81, + "eval_loss": 0.9114255905151367, + "eval_runtime": 519.3919, + "eval_samples_per_second": 14.708, + "eval_wer": 0.333314274278853, + "step": 52840 + }, + { + "epoch": 7.82, + "learning_rate": 6.114243323442137e-06, + "loss": 1.0411, + "step": 52880 + }, + { + "epoch": 7.82, + "eval_loss": 0.8975634574890137, + "eval_runtime": 519.352, + "eval_samples_per_second": 14.709, + "eval_wer": 0.3323136739186369, + "step": 52880 + }, + { + "epoch": 7.82, + "learning_rate": 6.111275964391692e-06, + "loss": 1.0534, + "step": 52920 + }, + { + "epoch": 7.82, + "eval_loss": 0.9073917865753174, + "eval_runtime": 518.1439, + "eval_samples_per_second": 14.743, + "eval_wer": 0.3328854455530461, + "step": 52920 + }, + { + "epoch": 7.83, + "learning_rate": 6.108308605341247e-06, + "loss": 1.0327, + "step": 52960 + }, + { + "epoch": 7.83, + "eval_loss": 0.8746650815010071, + "eval_runtime": 517.8455, + "eval_samples_per_second": 14.752, + "eval_wer": 0.3302552960347637, + "step": 52960 + }, + { + "epoch": 7.83, + "learning_rate": 6.105341246290801e-06, + "loss": 1.0306, + "step": 53000 + }, + { + "epoch": 7.83, + "eval_loss": 0.8979204893112183, + "eval_runtime": 518.7583, + "eval_samples_per_second": 14.726, + "eval_wer": 0.33205637668315274, + "step": 53000 + }, + { + "epoch": 7.84, + "learning_rate": 6.102373887240357e-06, + "loss": 1.0362, + "step": 53040 + }, + { + "epoch": 7.84, + "eval_loss": 0.8609880208969116, + "eval_runtime": 520.1154, + "eval_samples_per_second": 14.687, + "eval_wer": 0.3307127133422911, + "step": 53040 + }, + { + "epoch": 7.85, + "learning_rate": 6.099406528189912e-06, + "loss": 1.0352, + "step": 53080 + }, + { + "epoch": 7.85, + "eval_loss": 0.8837307691574097, + "eval_runtime": 518.6463, + "eval_samples_per_second": 14.729, + "eval_wer": 0.33094142199605475, + "step": 53080 + }, + { + "epoch": 7.85, + "learning_rate": 6.096439169139466e-06, + "loss": 0.9803, + "step": 53120 + }, + { + "epoch": 7.85, + "eval_loss": 0.8962290287017822, + "eval_runtime": 518.6161, + "eval_samples_per_second": 14.73, + "eval_wer": 0.3313416621401412, + "step": 53120 + }, + { + "epoch": 7.86, + "learning_rate": 6.093471810089021e-06, + "loss": 1.0335, + "step": 53160 + }, + { + "epoch": 7.86, + "eval_loss": 0.8745282292366028, + "eval_runtime": 519.0043, + "eval_samples_per_second": 14.719, + "eval_wer": 0.3303124731982046, + "step": 53160 + }, + { + "epoch": 7.86, + "learning_rate": 6.090504451038576e-06, + "loss": 0.9947, + "step": 53200 + }, + { + "epoch": 7.86, + "eval_loss": 0.9225924611091614, + "eval_runtime": 518.0721, + "eval_samples_per_second": 14.745, + "eval_wer": 0.33265673689928243, + "step": 53200 + }, + { + "epoch": 7.87, + "learning_rate": 6.087537091988131e-06, + "loss": 0.9613, + "step": 53240 + }, + { + "epoch": 7.87, + "eval_loss": 0.9433957934379578, + "eval_runtime": 519.1778, + "eval_samples_per_second": 14.714, + "eval_wer": 0.3346579376197147, + "step": 53240 + }, + { + "epoch": 7.88, + "learning_rate": 6.084569732937686e-06, + "loss": 1.0077, + "step": 53280 + }, + { + "epoch": 7.88, + "eval_loss": 0.9143416881561279, + "eval_runtime": 519.5039, + "eval_samples_per_second": 14.704, + "eval_wer": 0.3332570971154121, + "step": 53280 + }, + { + "epoch": 7.88, + "learning_rate": 6.081602373887241e-06, + "loss": 0.9941, + "step": 53320 + }, + { + "epoch": 7.88, + "eval_loss": 0.9404259920120239, + "eval_runtime": 519.9775, + "eval_samples_per_second": 14.691, + "eval_wer": 0.334429228965951, + "step": 53320 + }, + { + "epoch": 7.89, + "learning_rate": 6.078635014836796e-06, + "loss": 1.0474, + "step": 53360 + }, + { + "epoch": 7.89, + "eval_loss": 0.8661729097366333, + "eval_runtime": 517.4935, + "eval_samples_per_second": 14.762, + "eval_wer": 0.3298264673089568, + "step": 53360 + }, + { + "epoch": 7.89, + "learning_rate": 6.07566765578635e-06, + "loss": 1.0666, + "step": 53400 + }, + { + "epoch": 7.89, + "eval_loss": 0.9005254507064819, + "eval_runtime": 524.0414, + "eval_samples_per_second": 14.577, + "eval_wer": 0.33182766802938907, + "step": 53400 + }, + { + "epoch": 7.9, + "learning_rate": 6.072700296735905e-06, + "loss": 1.0224, + "step": 53440 + }, + { + "epoch": 7.9, + "eval_loss": 0.8804164528846741, + "eval_runtime": 519.2458, + "eval_samples_per_second": 14.712, + "eval_wer": 0.33036965036164556, + "step": 53440 + }, + { + "epoch": 7.91, + "learning_rate": 6.069732937685461e-06, + "loss": 1.0093, + "step": 53480 + }, + { + "epoch": 7.91, + "eval_loss": 0.9416154026985168, + "eval_runtime": 520.9355, + "eval_samples_per_second": 14.664, + "eval_wer": 0.3353726521627262, + "step": 53480 + }, + { + "epoch": 7.91, + "learning_rate": 6.066765578635016e-06, + "loss": 0.9504, + "step": 53520 + }, + { + "epoch": 7.91, + "eval_loss": 0.9449346661567688, + "eval_runtime": 518.208, + "eval_samples_per_second": 14.741, + "eval_wer": 0.33520112067240343, + "step": 53520 + }, + { + "epoch": 7.92, + "learning_rate": 6.06379821958457e-06, + "loss": 1.0073, + "step": 53560 + }, + { + "epoch": 7.92, + "eval_loss": 0.9140265583992004, + "eval_runtime": 518.6623, + "eval_samples_per_second": 14.728, + "eval_wer": 0.3323708510820778, + "step": 53560 + }, + { + "epoch": 7.92, + "learning_rate": 6.060830860534125e-06, + "loss": 1.0057, + "step": 53600 + }, + { + "epoch": 7.92, + "eval_loss": 0.9610195755958557, + "eval_runtime": 520.6532, + "eval_samples_per_second": 14.672, + "eval_wer": 0.3359444237971354, + "step": 53600 + }, + { + "epoch": 7.93, + "learning_rate": 6.057863501483679e-06, + "loss": 0.9963, + "step": 53640 + }, + { + "epoch": 7.93, + "eval_loss": 0.9419493079185486, + "eval_runtime": 520.28, + "eval_samples_per_second": 14.682, + "eval_wer": 0.33380028016810087, + "step": 53640 + }, + { + "epoch": 7.93, + "learning_rate": 6.054896142433235e-06, + "loss": 0.9722, + "step": 53680 + }, + { + "epoch": 7.93, + "eval_loss": 0.9281905293464661, + "eval_runtime": 519.4816, + "eval_samples_per_second": 14.705, + "eval_wer": 0.33282826838960516, + "step": 53680 + }, + { + "epoch": 7.94, + "learning_rate": 6.05192878338279e-06, + "loss": 1.077, + "step": 53720 + }, + { + "epoch": 7.94, + "eval_loss": 0.9114858508110046, + "eval_runtime": 520.0796, + "eval_samples_per_second": 14.688, + "eval_wer": 0.33162754795734584, + "step": 53720 + }, + { + "epoch": 7.95, + "learning_rate": 6.048961424332345e-06, + "loss": 1.0097, + "step": 53760 + }, + { + "epoch": 7.95, + "eval_loss": 0.9414505958557129, + "eval_runtime": 519.7392, + "eval_samples_per_second": 14.698, + "eval_wer": 0.3337716915863804, + "step": 53760 + }, + { + "epoch": 7.95, + "learning_rate": 6.0459940652818995e-06, + "loss": 1.022, + "step": 53800 + }, + { + "epoch": 7.95, + "eval_loss": 0.9282048940658569, + "eval_runtime": 519.3293, + "eval_samples_per_second": 14.709, + "eval_wer": 0.332628148317562, + "step": 53800 + }, + { + "epoch": 7.96, + "learning_rate": 6.043026706231454e-06, + "loss": 1.0066, + "step": 53840 + }, + { + "epoch": 7.96, + "eval_loss": 0.9492064714431763, + "eval_runtime": 518.2481, + "eval_samples_per_second": 14.74, + "eval_wer": 0.33411475456702594, + "step": 53840 + }, + { + "epoch": 7.96, + "learning_rate": 6.04005934718101e-06, + "loss": 1.0276, + "step": 53880 + }, + { + "epoch": 7.96, + "eval_loss": 0.9397733807563782, + "eval_runtime": 520.2387, + "eval_samples_per_second": 14.684, + "eval_wer": 0.33265673689928243, + "step": 53880 + }, + { + "epoch": 7.97, + "learning_rate": 6.0370919881305645e-06, + "loss": 1.0596, + "step": 53920 + }, + { + "epoch": 7.97, + "eval_loss": 0.9083213806152344, + "eval_runtime": 519.6244, + "eval_samples_per_second": 14.701, + "eval_wer": 0.33094142199605475, + "step": 53920 + }, + { + "epoch": 7.98, + "learning_rate": 6.034124629080119e-06, + "loss": 0.9448, + "step": 53960 + }, + { + "epoch": 7.98, + "eval_loss": 0.9528515338897705, + "eval_runtime": 519.1287, + "eval_samples_per_second": 14.715, + "eval_wer": 0.33337145144229396, + "step": 53960 + }, + { + "epoch": 7.98, + "learning_rate": 6.031157270029674e-06, + "loss": 1.0592, + "step": 54000 + }, + { + "epoch": 7.98, + "eval_loss": 0.9260146021842957, + "eval_runtime": 519.4402, + "eval_samples_per_second": 14.706, + "eval_wer": 0.3317990794476686, + "step": 54000 + }, + { + "epoch": 7.99, + "learning_rate": 6.028189910979229e-06, + "loss": 0.9947, + "step": 54040 + }, + { + "epoch": 7.99, + "eval_loss": 0.9357885718345642, + "eval_runtime": 518.6206, + "eval_samples_per_second": 14.729, + "eval_wer": 0.3327425026444438, + "step": 54040 + }, + { + "epoch": 7.99, + "learning_rate": 6.025222551928784e-06, + "loss": 1.0663, + "step": 54080 + }, + { + "epoch": 7.99, + "eval_loss": 0.927927553653717, + "eval_runtime": 519.1374, + "eval_samples_per_second": 14.715, + "eval_wer": 0.3327710912261643, + "step": 54080 + }, + { + "epoch": 8.0, + "learning_rate": 6.022255192878339e-06, + "loss": 0.8682, + "step": 54120 + }, + { + "epoch": 8.0, + "eval_loss": 0.9807685613632202, + "eval_runtime": 518.1119, + "eval_samples_per_second": 14.744, + "eval_wer": 0.3374024414648789, + "step": 54120 + }, + { + "epoch": 8.01, + "learning_rate": 6.019287833827894e-06, + "loss": 1.0178, + "step": 54160 + }, + { + "epoch": 8.01, + "eval_loss": 0.9910249710083008, + "eval_runtime": 517.0469, + "eval_samples_per_second": 14.774, + "eval_wer": 0.33780268160896537, + "step": 54160 + }, + { + "epoch": 8.01, + "learning_rate": 6.016320474777448e-06, + "loss": 0.9727, + "step": 54200 + }, + { + "epoch": 8.01, + "eval_loss": 0.9268185496330261, + "eval_runtime": 518.2728, + "eval_samples_per_second": 14.739, + "eval_wer": 0.3325137939906801, + "step": 54200 + }, + { + "epoch": 8.02, + "learning_rate": 6.0133531157270035e-06, + "loss": 0.9928, + "step": 54240 + }, + { + "epoch": 8.02, + "eval_loss": 0.9080156683921814, + "eval_runtime": 523.7201, + "eval_samples_per_second": 14.586, + "eval_wer": 0.33182766802938907, + "step": 54240 + }, + { + "epoch": 8.02, + "learning_rate": 6.010385756676559e-06, + "loss": 0.9747, + "step": 54280 + }, + { + "epoch": 8.02, + "eval_loss": 0.9629383087158203, + "eval_runtime": 517.8587, + "eval_samples_per_second": 14.751, + "eval_wer": 0.335172532090683, + "step": 54280 + }, + { + "epoch": 8.03, + "learning_rate": 6.007418397626113e-06, + "loss": 1.004, + "step": 54320 + }, + { + "epoch": 8.03, + "eval_loss": 0.9308258295059204, + "eval_runtime": 519.0444, + "eval_samples_per_second": 14.717, + "eval_wer": 0.33257097115412104, + "step": 54320 + }, + { + "epoch": 8.04, + "learning_rate": 6.0044510385756685e-06, + "loss": 1.0673, + "step": 54360 + }, + { + "epoch": 8.04, + "eval_loss": 0.9033301472663879, + "eval_runtime": 518.5143, + "eval_samples_per_second": 14.732, + "eval_wer": 0.3301123531261614, + "step": 54360 + }, + { + "epoch": 8.04, + "learning_rate": 6.001483679525223e-06, + "loss": 1.0225, + "step": 54400 + }, + { + "epoch": 8.04, + "eval_loss": 0.9338165521621704, + "eval_runtime": 519.0166, + "eval_samples_per_second": 14.718, + "eval_wer": 0.33308556562508934, + "step": 54400 + }, + { + "epoch": 8.05, + "learning_rate": 5.998516320474777e-06, + "loss": 0.9509, + "step": 54440 + }, + { + "epoch": 8.05, + "eval_loss": 0.9833784699440002, + "eval_runtime": 519.5542, + "eval_samples_per_second": 14.703, + "eval_wer": 0.33665913834014694, + "step": 54440 + }, + { + "epoch": 8.05, + "learning_rate": 5.995548961424333e-06, + "loss": 0.9988, + "step": 54480 + }, + { + "epoch": 8.05, + "eval_loss": 0.8862904906272888, + "eval_runtime": 518.368, + "eval_samples_per_second": 14.737, + "eval_wer": 0.3284256268046542, + "step": 54480 + }, + { + "epoch": 8.06, + "learning_rate": 5.992581602373888e-06, + "loss": 0.9794, + "step": 54520 + }, + { + "epoch": 8.06, + "eval_loss": 0.9186516404151917, + "eval_runtime": 518.5361, + "eval_samples_per_second": 14.732, + "eval_wer": 0.33105577632293665, + "step": 54520 + }, + { + "epoch": 8.07, + "learning_rate": 5.989614243323442e-06, + "loss": 0.9576, + "step": 54560 + }, + { + "epoch": 8.07, + "eval_loss": 0.9740708470344543, + "eval_runtime": 517.4858, + "eval_samples_per_second": 14.762, + "eval_wer": 0.33562994939821034, + "step": 54560 + }, + { + "epoch": 8.07, + "learning_rate": 5.986646884272998e-06, + "loss": 1.0373, + "step": 54600 + }, + { + "epoch": 8.07, + "eval_loss": 0.9146999716758728, + "eval_runtime": 522.0886, + "eval_samples_per_second": 14.632, + "eval_wer": 0.33162754795734584, + "step": 54600 + }, + { + "epoch": 8.08, + "learning_rate": 5.983679525222552e-06, + "loss": 1.0139, + "step": 54640 + }, + { + "epoch": 8.08, + "eval_loss": 0.9584102630615234, + "eval_runtime": 518.1006, + "eval_samples_per_second": 14.744, + "eval_wer": 0.335172532090683, + "step": 54640 + }, + { + "epoch": 8.08, + "learning_rate": 5.9807121661721066e-06, + "loss": 0.9856, + "step": 54680 + }, + { + "epoch": 8.08, + "eval_loss": 0.9371985793113708, + "eval_runtime": 517.3078, + "eval_samples_per_second": 14.767, + "eval_wer": 0.3339718116584236, + "step": 54680 + }, + { + "epoch": 8.09, + "learning_rate": 5.977744807121663e-06, + "loss": 0.9653, + "step": 54720 + }, + { + "epoch": 8.09, + "eval_loss": 1.0169464349746704, + "eval_runtime": 518.626, + "eval_samples_per_second": 14.729, + "eval_wer": 0.3412333114154207, + "step": 54720 + }, + { + "epoch": 8.09, + "learning_rate": 5.974777448071217e-06, + "loss": 1.0847, + "step": 54760 + }, + { + "epoch": 8.09, + "eval_loss": 0.9586917757987976, + "eval_runtime": 518.9961, + "eval_samples_per_second": 14.719, + "eval_wer": 0.3368020812487493, + "step": 54760 + }, + { + "epoch": 8.1, + "learning_rate": 5.971810089020772e-06, + "loss": 0.9641, + "step": 54800 + }, + { + "epoch": 8.1, + "eval_loss": 0.9320694804191589, + "eval_runtime": 517.4176, + "eval_samples_per_second": 14.764, + "eval_wer": 0.334429228965951, + "step": 54800 + }, + { + "epoch": 8.11, + "learning_rate": 5.968842729970327e-06, + "loss": 0.9631, + "step": 54840 + }, + { + "epoch": 8.11, + "eval_loss": 0.8968454003334045, + "eval_runtime": 518.4896, + "eval_samples_per_second": 14.733, + "eval_wer": 0.33097001057777525, + "step": 54840 + }, + { + "epoch": 8.11, + "learning_rate": 5.965875370919881e-06, + "loss": 1.0437, + "step": 54880 + }, + { + "epoch": 8.11, + "eval_loss": 0.9382304549217224, + "eval_runtime": 518.1116, + "eval_samples_per_second": 14.744, + "eval_wer": 0.33417193173046683, + "step": 54880 + }, + { + "epoch": 8.12, + "learning_rate": 5.9629080118694375e-06, + "loss": 0.9824, + "step": 54920 + }, + { + "epoch": 8.12, + "eval_loss": 0.9467187523841858, + "eval_runtime": 518.0731, + "eval_samples_per_second": 14.745, + "eval_wer": 0.3352297092541239, + "step": 54920 + }, + { + "epoch": 8.12, + "learning_rate": 5.959940652818992e-06, + "loss": 0.9637, + "step": 54960 + }, + { + "epoch": 8.12, + "eval_loss": 0.9337650537490845, + "eval_runtime": 519.2953, + "eval_samples_per_second": 14.71, + "eval_wer": 0.3334858057691758, + "step": 54960 + }, + { + "epoch": 8.13, + "learning_rate": 5.956973293768546e-06, + "loss": 0.8906, + "step": 55000 + }, + { + "epoch": 8.13, + "eval_loss": 0.9389777183532715, + "eval_runtime": 518.7921, + "eval_samples_per_second": 14.725, + "eval_wer": 0.33342862860573486, + "step": 55000 + }, + { + "epoch": 8.14, + "learning_rate": 5.954005934718101e-06, + "loss": 1.0066, + "step": 55040 + }, + { + "epoch": 8.14, + "eval_loss": 0.9180696606636047, + "eval_runtime": 518.4872, + "eval_samples_per_second": 14.733, + "eval_wer": 0.33068412476057063, + "step": 55040 + }, + { + "epoch": 8.14, + "learning_rate": 5.951038575667656e-06, + "loss": 0.9818, + "step": 55080 + }, + { + "epoch": 8.14, + "eval_loss": 0.9195407629013062, + "eval_runtime": 521.0114, + "eval_samples_per_second": 14.662, + "eval_wer": 0.3311701306498185, + "step": 55080 + }, + { + "epoch": 8.15, + "learning_rate": 5.948071216617211e-06, + "loss": 1.0012, + "step": 55120 + }, + { + "epoch": 8.15, + "eval_loss": 0.9449203610420227, + "eval_runtime": 520.0753, + "eval_samples_per_second": 14.688, + "eval_wer": 0.3327139140627233, + "step": 55120 + }, + { + "epoch": 8.15, + "learning_rate": 5.945103857566767e-06, + "loss": 0.9565, + "step": 55160 + }, + { + "epoch": 8.15, + "eval_loss": 0.9606163501739502, + "eval_runtime": 518.2504, + "eval_samples_per_second": 14.74, + "eval_wer": 0.333314274278853, + "step": 55160 + }, + { + "epoch": 8.16, + "learning_rate": 5.942136498516321e-06, + "loss": 0.9488, + "step": 55200 + }, + { + "epoch": 8.16, + "eval_loss": 0.9426321983337402, + "eval_runtime": 523.9584, + "eval_samples_per_second": 14.579, + "eval_wer": 0.3317704908659481, + "step": 55200 + }, + { + "epoch": 8.17, + "learning_rate": 5.9391691394658755e-06, + "loss": 0.998, + "step": 55240 + }, + { + "epoch": 8.17, + "eval_loss": 0.9236483573913574, + "eval_runtime": 518.1984, + "eval_samples_per_second": 14.741, + "eval_wer": 0.331141542068098, + "step": 55240 + }, + { + "epoch": 8.17, + "learning_rate": 5.93620178041543e-06, + "loss": 0.9986, + "step": 55280 + }, + { + "epoch": 8.17, + "eval_loss": 0.9055008888244629, + "eval_runtime": 519.6291, + "eval_samples_per_second": 14.701, + "eval_wer": 0.33054118185196835, + "step": 55280 + }, + { + "epoch": 8.18, + "learning_rate": 5.933234421364986e-06, + "loss": 1.0164, + "step": 55320 + }, + { + "epoch": 8.18, + "eval_loss": 0.9060313701629639, + "eval_runtime": 519.2682, + "eval_samples_per_second": 14.711, + "eval_wer": 0.33105577632293665, + "step": 55320 + }, + { + "epoch": 8.18, + "learning_rate": 5.9302670623145405e-06, + "loss": 0.9865, + "step": 55360 + }, + { + "epoch": 8.18, + "eval_loss": 0.9024366736412048, + "eval_runtime": 518.7055, + "eval_samples_per_second": 14.727, + "eval_wer": 0.3301409417078819, + "step": 55360 + }, + { + "epoch": 8.19, + "learning_rate": 5.927299703264096e-06, + "loss": 0.9828, + "step": 55400 + }, + { + "epoch": 8.19, + "eval_loss": 0.9337038993835449, + "eval_runtime": 519.8668, + "eval_samples_per_second": 14.694, + "eval_wer": 0.33257097115412104, + "step": 55400 + }, + { + "epoch": 8.2, + "learning_rate": 5.92433234421365e-06, + "loss": 1.0372, + "step": 55440 + }, + { + "epoch": 8.2, + "eval_loss": 0.9524915814399719, + "eval_runtime": 519.3956, + "eval_samples_per_second": 14.707, + "eval_wer": 0.33345721718745536, + "step": 55440 + }, + { + "epoch": 8.2, + "learning_rate": 5.921364985163205e-06, + "loss": 1.1036, + "step": 55480 + }, + { + "epoch": 8.2, + "eval_loss": 0.8830329775810242, + "eval_runtime": 519.5369, + "eval_samples_per_second": 14.703, + "eval_wer": 0.32942622716487036, + "step": 55480 + }, + { + "epoch": 8.21, + "learning_rate": 5.918397626112759e-06, + "loss": 1.006, + "step": 55520 + }, + { + "epoch": 8.21, + "eval_loss": 0.9073262810707092, + "eval_runtime": 518.6344, + "eval_samples_per_second": 14.729, + "eval_wer": 0.3304840046885274, + "step": 55520 + }, + { + "epoch": 8.21, + "learning_rate": 5.915430267062315e-06, + "loss": 0.9736, + "step": 55560 + }, + { + "epoch": 8.21, + "eval_loss": 0.9118548631668091, + "eval_runtime": 518.6247, + "eval_samples_per_second": 14.729, + "eval_wer": 0.33028388461648417, + "step": 55560 + }, + { + "epoch": 8.22, + "learning_rate": 5.91246290801187e-06, + "loss": 0.9721, + "step": 55600 + }, + { + "epoch": 8.22, + "eval_loss": 0.9138809442520142, + "eval_runtime": 518.8548, + "eval_samples_per_second": 14.723, + "eval_wer": 0.3309985991594957, + "step": 55600 + }, + { + "epoch": 8.22, + "learning_rate": 5.909495548961425e-06, + "loss": 0.9419, + "step": 55640 + }, + { + "epoch": 8.22, + "eval_loss": 0.9358281493186951, + "eval_runtime": 519.9766, + "eval_samples_per_second": 14.691, + "eval_wer": 0.3318562566111095, + "step": 55640 + }, + { + "epoch": 8.23, + "learning_rate": 5.9065281899109795e-06, + "loss": 0.9756, + "step": 55680 + }, + { + "epoch": 8.23, + "eval_loss": 0.9191535711288452, + "eval_runtime": 520.2189, + "eval_samples_per_second": 14.684, + "eval_wer": 0.3312273078132594, + "step": 55680 + }, + { + "epoch": 8.24, + "learning_rate": 5.903560830860534e-06, + "loss": 0.9704, + "step": 55720 + }, + { + "epoch": 8.24, + "eval_loss": 0.9552555084228516, + "eval_runtime": 519.2002, + "eval_samples_per_second": 14.713, + "eval_wer": 0.33471511478315563, + "step": 55720 + }, + { + "epoch": 8.24, + "learning_rate": 5.90059347181009e-06, + "loss": 1.028, + "step": 55760 + }, + { + "epoch": 8.24, + "eval_loss": 0.9229303002357483, + "eval_runtime": 521.3422, + "eval_samples_per_second": 14.653, + "eval_wer": 0.3313702507218617, + "step": 55760 + }, + { + "epoch": 8.25, + "learning_rate": 5.8976261127596445e-06, + "loss": 0.9973, + "step": 55800 + }, + { + "epoch": 8.25, + "eval_loss": 0.9124132990837097, + "eval_runtime": 523.8259, + "eval_samples_per_second": 14.583, + "eval_wer": 0.3309985991594957, + "step": 55800 + }, + { + "epoch": 8.25, + "learning_rate": 5.894658753709199e-06, + "loss": 1.0245, + "step": 55840 + }, + { + "epoch": 8.25, + "eval_loss": 0.9190382957458496, + "eval_runtime": 524.8448, + "eval_samples_per_second": 14.555, + "eval_wer": 0.33148460504874355, + "step": 55840 + }, + { + "epoch": 8.26, + "learning_rate": 5.891691394658754e-06, + "loss": 0.9874, + "step": 55880 + }, + { + "epoch": 8.26, + "eval_loss": 0.9476956725120544, + "eval_runtime": 524.0648, + "eval_samples_per_second": 14.576, + "eval_wer": 0.3330569770433689, + "step": 55880 + }, + { + "epoch": 8.27, + "learning_rate": 5.888724035608309e-06, + "loss": 1.0695, + "step": 55920 + }, + { + "epoch": 8.27, + "eval_loss": 0.8817742466926575, + "eval_runtime": 524.0231, + "eval_samples_per_second": 14.578, + "eval_wer": 0.3291117527659453, + "step": 55920 + }, + { + "epoch": 8.27, + "learning_rate": 5.885756676557865e-06, + "loss": 1.0507, + "step": 55960 + }, + { + "epoch": 8.27, + "eval_loss": 0.8866465091705322, + "eval_runtime": 528.2541, + "eval_samples_per_second": 14.461, + "eval_wer": 0.32925469567454757, + "step": 55960 + }, + { + "epoch": 8.28, + "learning_rate": 5.882789317507419e-06, + "loss": 1.0185, + "step": 56000 + }, + { + "epoch": 8.28, + "eval_loss": 0.9166718125343323, + "eval_runtime": 528.5367, + "eval_samples_per_second": 14.453, + "eval_wer": 0.3313702507218617, + "step": 56000 + }, + { + "epoch": 8.28, + "learning_rate": 5.879821958456974e-06, + "loss": 1.0058, + "step": 56040 + }, + { + "epoch": 8.28, + "eval_loss": 0.8898577094078064, + "eval_runtime": 524.3905, + "eval_samples_per_second": 14.567, + "eval_wer": 0.32914034134766573, + "step": 56040 + }, + { + "epoch": 8.29, + "learning_rate": 5.876854599406528e-06, + "loss": 0.9862, + "step": 56080 + }, + { + "epoch": 8.29, + "eval_loss": 0.8976664543151855, + "eval_runtime": 527.4166, + "eval_samples_per_second": 14.484, + "eval_wer": 0.32891163269390206, + "step": 56080 + }, + { + "epoch": 8.3, + "learning_rate": 5.873887240356083e-06, + "loss": 1.0068, + "step": 56120 + }, + { + "epoch": 8.3, + "eval_loss": 0.886381983757019, + "eval_runtime": 526.0566, + "eval_samples_per_second": 14.521, + "eval_wer": 0.32731067211755627, + "step": 56120 + }, + { + "epoch": 8.3, + "learning_rate": 5.870919881305639e-06, + "loss": 1.0202, + "step": 56160 + }, + { + "epoch": 8.3, + "eval_loss": 0.9239830374717712, + "eval_runtime": 524.5252, + "eval_samples_per_second": 14.564, + "eval_wer": 0.3306555361788502, + "step": 56160 + }, + { + "epoch": 8.31, + "learning_rate": 5.867952522255194e-06, + "loss": 1.0074, + "step": 56200 + }, + { + "epoch": 8.31, + "eval_loss": 0.9119540452957153, + "eval_runtime": 525.304, + "eval_samples_per_second": 14.542, + "eval_wer": 0.3296263472369136, + "step": 56200 + }, + { + "epoch": 8.31, + "learning_rate": 5.8649851632047484e-06, + "loss": 0.9895, + "step": 56240 + }, + { + "epoch": 8.31, + "eval_loss": 0.8701897859573364, + "eval_runtime": 526.1752, + "eval_samples_per_second": 14.518, + "eval_wer": 0.3253666485605649, + "step": 56240 + }, + { + "epoch": 8.32, + "learning_rate": 5.862017804154303e-06, + "loss": 1.1077, + "step": 56280 + }, + { + "epoch": 8.32, + "eval_loss": 0.8419491052627563, + "eval_runtime": 525.5205, + "eval_samples_per_second": 14.536, + "eval_wer": 0.3251665284885217, + "step": 56280 + }, + { + "epoch": 8.33, + "learning_rate": 5.859050445103857e-06, + "loss": 0.9847, + "step": 56320 + }, + { + "epoch": 8.33, + "eval_loss": 0.9195114374160767, + "eval_runtime": 527.4362, + "eval_samples_per_second": 14.483, + "eval_wer": 0.3299694102175591, + "step": 56320 + }, + { + "epoch": 8.33, + "learning_rate": 5.8560830860534135e-06, + "loss": 0.994, + "step": 56360 + }, + { + "epoch": 8.33, + "eval_loss": 0.8926817774772644, + "eval_runtime": 525.1788, + "eval_samples_per_second": 14.546, + "eval_wer": 0.327853855170245, + "step": 56360 + }, + { + "epoch": 8.34, + "learning_rate": 5.853115727002968e-06, + "loss": 0.9308, + "step": 56400 + }, + { + "epoch": 8.34, + "eval_loss": 0.9169015884399414, + "eval_runtime": 522.9119, + "eval_samples_per_second": 14.609, + "eval_wer": 0.3291975185111067, + "step": 56400 + }, + { + "epoch": 8.34, + "learning_rate": 5.850148367952523e-06, + "loss": 1.0194, + "step": 56440 + }, + { + "epoch": 8.34, + "eval_loss": 0.8959879279136658, + "eval_runtime": 521.5275, + "eval_samples_per_second": 14.647, + "eval_wer": 0.32831127247777236, + "step": 56440 + }, + { + "epoch": 8.35, + "learning_rate": 5.847181008902078e-06, + "loss": 0.9599, + "step": 56480 + }, + { + "epoch": 8.35, + "eval_loss": 0.9083085656166077, + "eval_runtime": 519.4548, + "eval_samples_per_second": 14.706, + "eval_wer": 0.3282826838960519, + "step": 56480 + }, + { + "epoch": 8.35, + "learning_rate": 5.844213649851632e-06, + "loss": 0.9996, + "step": 56520 + }, + { + "epoch": 8.35, + "eval_loss": 0.9500752687454224, + "eval_runtime": 521.3567, + "eval_samples_per_second": 14.652, + "eval_wer": 0.33154178221218444, + "step": 56520 + }, + { + "epoch": 8.36, + "learning_rate": 5.8412462908011865e-06, + "loss": 0.9857, + "step": 56560 + }, + { + "epoch": 8.36, + "eval_loss": 0.936362624168396, + "eval_runtime": 521.3869, + "eval_samples_per_second": 14.651, + "eval_wer": 0.32976929014551587, + "step": 56560 + }, + { + "epoch": 8.37, + "learning_rate": 5.838278931750743e-06, + "loss": 1.0368, + "step": 56600 + }, + { + "epoch": 8.37, + "eval_loss": 0.9017354249954224, + "eval_runtime": 519.6483, + "eval_samples_per_second": 14.7, + "eval_wer": 0.3282826838960519, + "step": 56600 + }, + { + "epoch": 8.37, + "learning_rate": 5.835311572700297e-06, + "loss": 1.0731, + "step": 56640 + }, + { + "epoch": 8.37, + "eval_loss": 0.9326215982437134, + "eval_runtime": 520.337, + "eval_samples_per_second": 14.681, + "eval_wer": 0.33051259327024785, + "step": 56640 + }, + { + "epoch": 8.38, + "learning_rate": 5.832344213649852e-06, + "loss": 0.9769, + "step": 56680 + }, + { + "epoch": 8.38, + "eval_loss": 0.9174826145172119, + "eval_runtime": 520.2834, + "eval_samples_per_second": 14.682, + "eval_wer": 0.32899739843906345, + "step": 56680 + }, + { + "epoch": 8.38, + "learning_rate": 5.829376854599407e-06, + "loss": 1.0009, + "step": 56720 + }, + { + "epoch": 8.38, + "eval_loss": 0.9340432286262512, + "eval_runtime": 519.7992, + "eval_samples_per_second": 14.696, + "eval_wer": 0.3302267074530433, + "step": 56720 + }, + { + "epoch": 8.39, + "learning_rate": 5.826409495548961e-06, + "loss": 0.9996, + "step": 56760 + }, + { + "epoch": 8.39, + "eval_loss": 0.9342213273048401, + "eval_runtime": 520.6038, + "eval_samples_per_second": 14.673, + "eval_wer": 0.3303410617799251, + "step": 56760 + }, + { + "epoch": 8.4, + "learning_rate": 5.823442136498517e-06, + "loss": 0.9266, + "step": 56800 + }, + { + "epoch": 8.4, + "eval_loss": 0.8999951481819153, + "eval_runtime": 520.9142, + "eval_samples_per_second": 14.665, + "eval_wer": 0.3281683295691701, + "step": 56800 + }, + { + "epoch": 8.4, + "learning_rate": 5.820474777448072e-06, + "loss": 0.96, + "step": 56840 + }, + { + "epoch": 8.4, + "eval_loss": 0.9408696889877319, + "eval_runtime": 520.5035, + "eval_samples_per_second": 14.676, + "eval_wer": 0.33094142199605475, + "step": 56840 + }, + { + "epoch": 8.41, + "learning_rate": 5.817507418397626e-06, + "loss": 0.9838, + "step": 56880 + }, + { + "epoch": 8.41, + "eval_loss": 0.9568617343902588, + "eval_runtime": 518.8737, + "eval_samples_per_second": 14.722, + "eval_wer": 0.3323708510820778, + "step": 56880 + }, + { + "epoch": 8.41, + "learning_rate": 5.8145400593471816e-06, + "loss": 1.0314, + "step": 56920 + }, + { + "epoch": 8.41, + "eval_loss": 0.9070338010787964, + "eval_runtime": 519.0651, + "eval_samples_per_second": 14.717, + "eval_wer": 0.32891163269390206, + "step": 56920 + }, + { + "epoch": 8.42, + "learning_rate": 5.811572700296736e-06, + "loss": 0.9666, + "step": 56960 + }, + { + "epoch": 8.42, + "eval_loss": 0.9046706557273865, + "eval_runtime": 519.4014, + "eval_samples_per_second": 14.707, + "eval_wer": 0.3287115126218588, + "step": 56960 + }, + { + "epoch": 8.43, + "learning_rate": 5.808605341246291e-06, + "loss": 0.9861, + "step": 57000 + }, + { + "epoch": 8.43, + "eval_loss": 0.9242555499076843, + "eval_runtime": 519.343, + "eval_samples_per_second": 14.709, + "eval_wer": 0.3301409417078819, + "step": 57000 + }, + { + "epoch": 8.43, + "learning_rate": 5.805637982195847e-06, + "loss": 0.9462, + "step": 57040 + }, + { + "epoch": 8.43, + "eval_loss": 0.9536969065666199, + "eval_runtime": 519.6794, + "eval_samples_per_second": 14.699, + "eval_wer": 0.331513193630464, + "step": 57040 + }, + { + "epoch": 8.44, + "learning_rate": 5.802670623145401e-06, + "loss": 1.0011, + "step": 57080 + }, + { + "epoch": 8.44, + "eval_loss": 0.924984872341156, + "eval_runtime": 519.8407, + "eval_samples_per_second": 14.695, + "eval_wer": 0.3300551759627205, + "step": 57080 + }, + { + "epoch": 8.44, + "learning_rate": 5.7997032640949555e-06, + "loss": 0.9367, + "step": 57120 + }, + { + "epoch": 8.44, + "eval_loss": 0.9104089736938477, + "eval_runtime": 520.8712, + "eval_samples_per_second": 14.666, + "eval_wer": 0.3294548157465908, + "step": 57120 + }, + { + "epoch": 8.45, + "learning_rate": 5.796735905044511e-06, + "loss": 1.0239, + "step": 57160 + }, + { + "epoch": 8.45, + "eval_loss": 0.921783983707428, + "eval_runtime": 519.6084, + "eval_samples_per_second": 14.701, + "eval_wer": 0.3299694102175591, + "step": 57160 + }, + { + "epoch": 8.46, + "learning_rate": 5.793768545994066e-06, + "loss": 0.9771, + "step": 57200 + }, + { + "epoch": 8.46, + "eval_loss": 0.9457646608352661, + "eval_runtime": 519.73, + "eval_samples_per_second": 14.698, + "eval_wer": 0.3310843649046571, + "step": 57200 + }, + { + "epoch": 8.46, + "learning_rate": 5.790801186943621e-06, + "loss": 1.0812, + "step": 57240 + }, + { + "epoch": 8.46, + "eval_loss": 0.9282727241516113, + "eval_runtime": 520.7032, + "eval_samples_per_second": 14.671, + "eval_wer": 0.3304840046885274, + "step": 57240 + }, + { + "epoch": 8.47, + "learning_rate": 5.787833827893176e-06, + "loss": 1.0559, + "step": 57280 + }, + { + "epoch": 8.47, + "eval_loss": 0.8927995562553406, + "eval_runtime": 521.2975, + "eval_samples_per_second": 14.654, + "eval_wer": 0.327853855170245, + "step": 57280 + }, + { + "epoch": 8.47, + "learning_rate": 5.78486646884273e-06, + "loss": 1.1124, + "step": 57320 + }, + { + "epoch": 8.47, + "eval_loss": 0.9157091975212097, + "eval_runtime": 519.3607, + "eval_samples_per_second": 14.708, + "eval_wer": 0.3291975185111067, + "step": 57320 + }, + { + "epoch": 8.48, + "learning_rate": 5.781899109792285e-06, + "loss": 1.0054, + "step": 57360 + }, + { + "epoch": 8.48, + "eval_loss": 0.8768503665924072, + "eval_runtime": 520.0747, + "eval_samples_per_second": 14.688, + "eval_wer": 0.32708196346379254, + "step": 57360 + }, + { + "epoch": 8.48, + "learning_rate": 5.778931750741841e-06, + "loss": 0.9398, + "step": 57400 + }, + { + "epoch": 8.48, + "eval_loss": 0.9484142065048218, + "eval_runtime": 520.7553, + "eval_samples_per_second": 14.669, + "eval_wer": 0.3312558963949798, + "step": 57400 + }, + { + "epoch": 8.49, + "learning_rate": 5.775964391691395e-06, + "loss": 1.0392, + "step": 57440 + }, + { + "epoch": 8.49, + "eval_loss": 0.9325774312019348, + "eval_runtime": 518.8299, + "eval_samples_per_second": 14.724, + "eval_wer": 0.3298264673089568, + "step": 57440 + }, + { + "epoch": 8.5, + "learning_rate": 5.7729970326409505e-06, + "loss": 0.9835, + "step": 57480 + }, + { + "epoch": 8.5, + "eval_loss": 0.8984606266021729, + "eval_runtime": 520.6204, + "eval_samples_per_second": 14.673, + "eval_wer": 0.32753938077131994, + "step": 57480 + }, + { + "epoch": 8.5, + "learning_rate": 5.770029673590505e-06, + "loss": 0.946, + "step": 57520 + }, + { + "epoch": 8.5, + "eval_loss": 0.8988058567047119, + "eval_runtime": 520.0124, + "eval_samples_per_second": 14.69, + "eval_wer": 0.32719631779067443, + "step": 57520 + }, + { + "epoch": 8.51, + "learning_rate": 5.767062314540059e-06, + "loss": 0.982, + "step": 57560 + }, + { + "epoch": 8.51, + "eval_loss": 0.9295728802680969, + "eval_runtime": 519.8996, + "eval_samples_per_second": 14.693, + "eval_wer": 0.32899739843906345, + "step": 57560 + }, + { + "epoch": 8.51, + "learning_rate": 5.764094955489614e-06, + "loss": 0.9707, + "step": 57600 + }, + { + "epoch": 8.51, + "eval_loss": 0.9120326638221741, + "eval_runtime": 519.7129, + "eval_samples_per_second": 14.699, + "eval_wer": 0.3272534949541153, + "step": 57600 + }, + { + "epoch": 8.52, + "learning_rate": 5.76112759643917e-06, + "loss": 1.0249, + "step": 57640 + }, + { + "epoch": 8.52, + "eval_loss": 0.9056265950202942, + "eval_runtime": 520.4549, + "eval_samples_per_second": 14.678, + "eval_wer": 0.3276537350982018, + "step": 57640 + }, + { + "epoch": 8.53, + "learning_rate": 5.7581602373887244e-06, + "loss": 0.9632, + "step": 57680 + }, + { + "epoch": 8.53, + "eval_loss": 0.9068199992179871, + "eval_runtime": 521.5792, + "eval_samples_per_second": 14.646, + "eval_wer": 0.3277109122616427, + "step": 57680 + }, + { + "epoch": 8.53, + "learning_rate": 5.75519287833828e-06, + "loss": 1.0395, + "step": 57720 + }, + { + "epoch": 8.53, + "eval_loss": 0.8932336568832397, + "eval_runtime": 522.0034, + "eval_samples_per_second": 14.634, + "eval_wer": 0.32702478630035164, + "step": 57720 + }, + { + "epoch": 8.54, + "learning_rate": 5.752225519287834e-06, + "loss": 0.9301, + "step": 57760 + }, + { + "epoch": 8.54, + "eval_loss": 0.9215984344482422, + "eval_runtime": 520.9238, + "eval_samples_per_second": 14.664, + "eval_wer": 0.3281683295691701, + "step": 57760 + }, + { + "epoch": 8.54, + "learning_rate": 5.749258160237389e-06, + "loss": 0.9514, + "step": 57800 + }, + { + "epoch": 8.54, + "eval_loss": 0.9382808804512024, + "eval_runtime": 520.4552, + "eval_samples_per_second": 14.678, + "eval_wer": 0.32951199291003175, + "step": 57800 + }, + { + "epoch": 8.55, + "learning_rate": 5.746290801186945e-06, + "loss": 1.0112, + "step": 57840 + }, + { + "epoch": 8.55, + "eval_loss": 0.9337457418441772, + "eval_runtime": 519.4762, + "eval_samples_per_second": 14.705, + "eval_wer": 0.3291975185111067, + "step": 57840 + }, + { + "epoch": 8.56, + "learning_rate": 5.743323442136499e-06, + "loss": 0.9577, + "step": 57880 + }, + { + "epoch": 8.56, + "eval_loss": 0.9250739812850952, + "eval_runtime": 525.1846, + "eval_samples_per_second": 14.545, + "eval_wer": 0.32874010120357927, + "step": 57880 + }, + { + "epoch": 8.56, + "learning_rate": 5.740356083086054e-06, + "loss": 1.0929, + "step": 57920 + }, + { + "epoch": 8.56, + "eval_loss": 0.8524065017700195, + "eval_runtime": 518.9072, + "eval_samples_per_second": 14.721, + "eval_wer": 0.3238514537293805, + "step": 57920 + }, + { + "epoch": 8.57, + "learning_rate": 5.737388724035609e-06, + "loss": 1.0986, + "step": 57960 + }, + { + "epoch": 8.57, + "eval_loss": 0.8917619585990906, + "eval_runtime": 520.4733, + "eval_samples_per_second": 14.677, + "eval_wer": 0.3268246662283084, + "step": 57960 + }, + { + "epoch": 8.57, + "learning_rate": 5.734421364985163e-06, + "loss": 0.9841, + "step": 58000 + }, + { + "epoch": 8.57, + "eval_loss": 0.9380680918693542, + "eval_runtime": 519.3852, + "eval_samples_per_second": 14.708, + "eval_wer": 0.32994082163583865, + "step": 58000 + }, + { + "epoch": 8.58, + "learning_rate": 5.731454005934719e-06, + "loss": 0.9764, + "step": 58040 + }, + { + "epoch": 8.58, + "eval_loss": 0.913580060005188, + "eval_runtime": 519.4369, + "eval_samples_per_second": 14.706, + "eval_wer": 0.328597158294977, + "step": 58040 + }, + { + "epoch": 8.59, + "learning_rate": 5.728486646884274e-06, + "loss": 1.0643, + "step": 58080 + }, + { + "epoch": 8.59, + "eval_loss": 0.8903910517692566, + "eval_runtime": 519.7554, + "eval_samples_per_second": 14.697, + "eval_wer": 0.32731067211755627, + "step": 58080 + }, + { + "epoch": 8.59, + "learning_rate": 5.725519287833828e-06, + "loss": 1.0474, + "step": 58120 + }, + { + "epoch": 8.59, + "eval_loss": 0.8941999077796936, + "eval_runtime": 518.7722, + "eval_samples_per_second": 14.725, + "eval_wer": 0.3272249063723949, + "step": 58120 + }, + { + "epoch": 8.6, + "learning_rate": 5.722551928783383e-06, + "loss": 0.9935, + "step": 58160 + }, + { + "epoch": 8.6, + "eval_loss": 0.9200472831726074, + "eval_runtime": 518.9265, + "eval_samples_per_second": 14.721, + "eval_wer": 0.3291689299293862, + "step": 58160 + }, + { + "epoch": 8.6, + "learning_rate": 5.719584569732938e-06, + "loss": 1.0042, + "step": 58200 + }, + { + "epoch": 8.6, + "eval_loss": 0.9005509614944458, + "eval_runtime": 521.2402, + "eval_samples_per_second": 14.655, + "eval_wer": 0.3276537350982018, + "step": 58200 + }, + { + "epoch": 8.61, + "learning_rate": 5.716617210682493e-06, + "loss": 0.9264, + "step": 58240 + }, + { + "epoch": 8.61, + "eval_loss": 0.9317583441734314, + "eval_runtime": 521.4489, + "eval_samples_per_second": 14.65, + "eval_wer": 0.32985505589067726, + "step": 58240 + }, + { + "epoch": 8.61, + "learning_rate": 5.713649851632048e-06, + "loss": 1.0599, + "step": 58280 + }, + { + "epoch": 8.61, + "eval_loss": 0.9049041271209717, + "eval_runtime": 519.2085, + "eval_samples_per_second": 14.713, + "eval_wer": 0.3279396209154064, + "step": 58280 + }, + { + "epoch": 8.62, + "learning_rate": 5.710682492581603e-06, + "loss": 1.0566, + "step": 58320 + }, + { + "epoch": 8.62, + "eval_loss": 0.8973127603530884, + "eval_runtime": 520.5911, + "eval_samples_per_second": 14.674, + "eval_wer": 0.3276823236799222, + "step": 58320 + }, + { + "epoch": 8.63, + "learning_rate": 5.707715133531158e-06, + "loss": 1.042, + "step": 58360 + }, + { + "epoch": 8.63, + "eval_loss": 0.860248863697052, + "eval_runtime": 523.4686, + "eval_samples_per_second": 14.593, + "eval_wer": 0.32539523714228535, + "step": 58360 + }, + { + "epoch": 8.63, + "learning_rate": 5.704747774480712e-06, + "loss": 0.9887, + "step": 58400 + }, + { + "epoch": 8.63, + "eval_loss": 0.8829447627067566, + "eval_runtime": 517.3063, + "eval_samples_per_second": 14.767, + "eval_wer": 0.32679607764658797, + "step": 58400 + }, + { + "epoch": 8.64, + "learning_rate": 5.701780415430268e-06, + "loss": 0.9712, + "step": 58440 + }, + { + "epoch": 8.64, + "eval_loss": 0.9397531747817993, + "eval_runtime": 519.4765, + "eval_samples_per_second": 14.705, + "eval_wer": 0.331141542068098, + "step": 58440 + }, + { + "epoch": 8.64, + "learning_rate": 5.698813056379823e-06, + "loss": 0.9171, + "step": 58480 + }, + { + "epoch": 8.64, + "eval_loss": 0.8779546022415161, + "eval_runtime": 520.7137, + "eval_samples_per_second": 14.67, + "eval_wer": 0.3272534949541153, + "step": 58480 + }, + { + "epoch": 8.65, + "learning_rate": 5.695845697329377e-06, + "loss": 1.0557, + "step": 58520 + }, + { + "epoch": 8.65, + "eval_loss": 0.8860147595405579, + "eval_runtime": 519.3122, + "eval_samples_per_second": 14.71, + "eval_wer": 0.32831127247777236, + "step": 58520 + }, + { + "epoch": 8.66, + "learning_rate": 5.692878338278932e-06, + "loss": 1.1645, + "step": 58560 + }, + { + "epoch": 8.66, + "eval_loss": 0.9000404477119446, + "eval_runtime": 521.5265, + "eval_samples_per_second": 14.647, + "eval_wer": 0.3287115126218588, + "step": 58560 + }, + { + "epoch": 8.66, + "learning_rate": 5.689910979228487e-06, + "loss": 0.9266, + "step": 58600 + }, + { + "epoch": 8.66, + "eval_loss": 0.9192754626274109, + "eval_runtime": 523.8179, + "eval_samples_per_second": 14.583, + "eval_wer": 0.3302552960347637, + "step": 58600 + }, + { + "epoch": 8.67, + "learning_rate": 5.686943620178041e-06, + "loss": 0.9649, + "step": 58640 + }, + { + "epoch": 8.67, + "eval_loss": 0.8975840210914612, + "eval_runtime": 521.0375, + "eval_samples_per_second": 14.661, + "eval_wer": 0.32874010120357927, + "step": 58640 + }, + { + "epoch": 8.67, + "learning_rate": 5.683976261127597e-06, + "loss": 0.991, + "step": 58680 + }, + { + "epoch": 8.67, + "eval_loss": 0.904628574848175, + "eval_runtime": 520.6262, + "eval_samples_per_second": 14.673, + "eval_wer": 0.32848280396809515, + "step": 58680 + }, + { + "epoch": 8.68, + "learning_rate": 5.681008902077152e-06, + "loss": 1.0155, + "step": 58720 + }, + { + "epoch": 8.68, + "eval_loss": 0.8757663369178772, + "eval_runtime": 521.1609, + "eval_samples_per_second": 14.658, + "eval_wer": 0.3277109122616427, + "step": 58720 + }, + { + "epoch": 8.69, + "learning_rate": 5.678041543026706e-06, + "loss": 1.0011, + "step": 58760 + }, + { + "epoch": 8.69, + "eval_loss": 0.8615052103996277, + "eval_runtime": 520.324, + "eval_samples_per_second": 14.681, + "eval_wer": 0.3265673689928243, + "step": 58760 + }, + { + "epoch": 8.69, + "learning_rate": 5.6750741839762615e-06, + "loss": 0.9705, + "step": 58800 + }, + { + "epoch": 8.69, + "eval_loss": 0.8760775327682495, + "eval_runtime": 521.3131, + "eval_samples_per_second": 14.653, + "eval_wer": 0.3269676091369107, + "step": 58800 + }, + { + "epoch": 8.7, + "learning_rate": 5.672106824925816e-06, + "loss": 0.9577, + "step": 58840 + }, + { + "epoch": 8.7, + "eval_loss": 0.914139449596405, + "eval_runtime": 523.9299, + "eval_samples_per_second": 14.58, + "eval_wer": 0.3297978787272363, + "step": 58840 + }, + { + "epoch": 8.7, + "learning_rate": 5.669139465875372e-06, + "loss": 1.0501, + "step": 58880 + }, + { + "epoch": 8.7, + "eval_loss": 0.8925902843475342, + "eval_runtime": 519.8138, + "eval_samples_per_second": 14.696, + "eval_wer": 0.3293690500014294, + "step": 58880 + }, + { + "epoch": 8.71, + "learning_rate": 5.6661721068249265e-06, + "loss": 0.9835, + "step": 58920 + }, + { + "epoch": 8.71, + "eval_loss": 0.8788085579872131, + "eval_runtime": 520.2307, + "eval_samples_per_second": 14.684, + "eval_wer": 0.32802538666056774, + "step": 58920 + }, + { + "epoch": 8.72, + "learning_rate": 5.663204747774481e-06, + "loss": 0.9653, + "step": 58960 + }, + { + "epoch": 8.72, + "eval_loss": 0.861724317073822, + "eval_runtime": 519.9306, + "eval_samples_per_second": 14.692, + "eval_wer": 0.3268246662283084, + "step": 58960 + }, + { + "epoch": 8.72, + "learning_rate": 5.6602373887240354e-06, + "loss": 1.0375, + "step": 59000 + }, + { + "epoch": 8.72, + "eval_loss": 0.8560379147529602, + "eval_runtime": 519.7998, + "eval_samples_per_second": 14.696, + "eval_wer": 0.3271391406272335, + "step": 59000 + }, + { + "epoch": 8.73, + "learning_rate": 5.657270029673591e-06, + "loss": 0.981, + "step": 59040 + }, + { + "epoch": 8.73, + "eval_loss": 0.9250243306159973, + "eval_runtime": 520.7725, + "eval_samples_per_second": 14.669, + "eval_wer": 0.33102718774121614, + "step": 59040 + }, + { + "epoch": 8.73, + "learning_rate": 5.654302670623146e-06, + "loss": 0.9514, + "step": 59080 + }, + { + "epoch": 8.73, + "eval_loss": 0.9064039587974548, + "eval_runtime": 523.5965, + "eval_samples_per_second": 14.589, + "eval_wer": 0.32976929014551587, + "step": 59080 + }, + { + "epoch": 8.74, + "learning_rate": 5.651335311572701e-06, + "loss": 0.9802, + "step": 59120 + }, + { + "epoch": 8.74, + "eval_loss": 0.8884864449501038, + "eval_runtime": 520.4021, + "eval_samples_per_second": 14.679, + "eval_wer": 0.32853998113153604, + "step": 59120 + }, + { + "epoch": 8.74, + "learning_rate": 5.648367952522256e-06, + "loss": 0.9699, + "step": 59160 + }, + { + "epoch": 8.74, + "eval_loss": 0.9057693481445312, + "eval_runtime": 520.9002, + "eval_samples_per_second": 14.665, + "eval_wer": 0.3302552960347637, + "step": 59160 + }, + { + "epoch": 8.75, + "learning_rate": 5.64540059347181e-06, + "loss": 0.9193, + "step": 59200 + }, + { + "epoch": 8.75, + "eval_loss": 0.9195528030395508, + "eval_runtime": 522.244, + "eval_samples_per_second": 14.627, + "eval_wer": 0.3312558963949798, + "step": 59200 + }, + { + "epoch": 8.76, + "learning_rate": 5.642433234421365e-06, + "loss": 0.9427, + "step": 59240 + }, + { + "epoch": 8.76, + "eval_loss": 0.9064352512359619, + "eval_runtime": 519.2256, + "eval_samples_per_second": 14.712, + "eval_wer": 0.33036965036164556, + "step": 59240 + }, + { + "epoch": 8.76, + "learning_rate": 5.639465875370921e-06, + "loss": 0.9946, + "step": 59280 + }, + { + "epoch": 8.76, + "eval_loss": 0.9065017700195312, + "eval_runtime": 522.1475, + "eval_samples_per_second": 14.63, + "eval_wer": 0.32976929014551587, + "step": 59280 + }, + { + "epoch": 8.77, + "learning_rate": 5.636498516320475e-06, + "loss": 1.0226, + "step": 59320 + }, + { + "epoch": 8.77, + "eval_loss": 0.8543415665626526, + "eval_runtime": 520.1343, + "eval_samples_per_second": 14.687, + "eval_wer": 0.3255953572143286, + "step": 59320 + }, + { + "epoch": 8.77, + "learning_rate": 5.6335311572700305e-06, + "loss": 0.9967, + "step": 59360 + }, + { + "epoch": 8.77, + "eval_loss": 0.8975327014923096, + "eval_runtime": 520.591, + "eval_samples_per_second": 14.674, + "eval_wer": 0.3292261070928271, + "step": 59360 + }, + { + "epoch": 8.78, + "learning_rate": 5.630563798219585e-06, + "loss": 0.9738, + "step": 59400 + }, + { + "epoch": 8.78, + "eval_loss": 0.9211122989654541, + "eval_runtime": 520.5783, + "eval_samples_per_second": 14.674, + "eval_wer": 0.3307413019240116, + "step": 59400 + }, + { + "epoch": 8.79, + "learning_rate": 5.627596439169139e-06, + "loss": 1.0756, + "step": 59440 + }, + { + "epoch": 8.79, + "eval_loss": 0.8780083060264587, + "eval_runtime": 520.3268, + "eval_samples_per_second": 14.681, + "eval_wer": 0.32702478630035164, + "step": 59440 + }, + { + "epoch": 8.79, + "learning_rate": 5.6246290801186955e-06, + "loss": 0.9634, + "step": 59480 + }, + { + "epoch": 8.79, + "eval_loss": 0.926011860370636, + "eval_runtime": 519.7187, + "eval_samples_per_second": 14.698, + "eval_wer": 0.3309985991594957, + "step": 59480 + }, + { + "epoch": 8.8, + "learning_rate": 5.62166172106825e-06, + "loss": 0.953, + "step": 59520 + }, + { + "epoch": 8.8, + "eval_loss": 0.8671967387199402, + "eval_runtime": 521.1907, + "eval_samples_per_second": 14.657, + "eval_wer": 0.3257383001229309, + "step": 59520 + }, + { + "epoch": 8.8, + "learning_rate": 5.618694362017804e-06, + "loss": 0.937, + "step": 59560 + }, + { + "epoch": 8.8, + "eval_loss": 0.9115512371063232, + "eval_runtime": 523.1977, + "eval_samples_per_second": 14.601, + "eval_wer": 0.32965493581863403, + "step": 59560 + }, + { + "epoch": 8.81, + "learning_rate": 5.61572700296736e-06, + "loss": 0.9954, + "step": 59600 + }, + { + "epoch": 8.81, + "eval_loss": 0.8873656392097473, + "eval_runtime": 519.7025, + "eval_samples_per_second": 14.699, + "eval_wer": 0.3277109122616427, + "step": 59600 + }, + { + "epoch": 8.82, + "learning_rate": 5.612759643916914e-06, + "loss": 1.0248, + "step": 59640 + }, + { + "epoch": 8.82, + "eval_loss": 0.8863810896873474, + "eval_runtime": 519.6567, + "eval_samples_per_second": 14.7, + "eval_wer": 0.3273964378627176, + "step": 59640 + }, + { + "epoch": 8.82, + "learning_rate": 5.6097922848664686e-06, + "loss": 0.9731, + "step": 59680 + }, + { + "epoch": 8.82, + "eval_loss": 0.9051077365875244, + "eval_runtime": 520.3827, + "eval_samples_per_second": 14.68, + "eval_wer": 0.328968809857343, + "step": 59680 + }, + { + "epoch": 8.83, + "learning_rate": 5.606824925816025e-06, + "loss": 0.9901, + "step": 59720 + }, + { + "epoch": 8.83, + "eval_loss": 0.9231013655662537, + "eval_runtime": 520.2673, + "eval_samples_per_second": 14.683, + "eval_wer": 0.3306269475971297, + "step": 59720 + }, + { + "epoch": 8.83, + "learning_rate": 5.603857566765579e-06, + "loss": 1.0422, + "step": 59760 + }, + { + "epoch": 8.83, + "eval_loss": 0.8664190769195557, + "eval_runtime": 520.2291, + "eval_samples_per_second": 14.684, + "eval_wer": 0.3263100717573401, + "step": 59760 + }, + { + "epoch": 8.84, + "learning_rate": 5.600890207715134e-06, + "loss": 0.9283, + "step": 59800 + }, + { + "epoch": 8.84, + "eval_loss": 0.897261381149292, + "eval_runtime": 524.898, + "eval_samples_per_second": 14.553, + "eval_wer": 0.32856856971325654, + "step": 59800 + }, + { + "epoch": 8.85, + "learning_rate": 5.597922848664689e-06, + "loss": 0.9746, + "step": 59840 + }, + { + "epoch": 8.85, + "eval_loss": 0.8954948782920837, + "eval_runtime": 519.482, + "eval_samples_per_second": 14.705, + "eval_wer": 0.32833986105949287, + "step": 59840 + }, + { + "epoch": 8.85, + "learning_rate": 5.594955489614243e-06, + "loss": 0.9697, + "step": 59880 + }, + { + "epoch": 8.85, + "eval_loss": 0.9146578311920166, + "eval_runtime": 520.8069, + "eval_samples_per_second": 14.668, + "eval_wer": 0.33042682752508645, + "step": 59880 + }, + { + "epoch": 8.86, + "learning_rate": 5.5919881305637995e-06, + "loss": 1.0429, + "step": 59920 + }, + { + "epoch": 8.86, + "eval_loss": 0.867885947227478, + "eval_runtime": 520.4667, + "eval_samples_per_second": 14.677, + "eval_wer": 0.326738900483147, + "step": 59920 + }, + { + "epoch": 8.86, + "learning_rate": 5.589020771513354e-06, + "loss": 1.001, + "step": 59960 + }, + { + "epoch": 8.86, + "eval_loss": 0.9102554321289062, + "eval_runtime": 520.1814, + "eval_samples_per_second": 14.685, + "eval_wer": 0.33028388461648417, + "step": 59960 + }, + { + "epoch": 8.87, + "learning_rate": 5.586053412462908e-06, + "loss": 0.9847, + "step": 60000 + }, + { + "epoch": 8.87, + "eval_loss": 0.8914312720298767, + "eval_runtime": 521.6994, + "eval_samples_per_second": 14.643, + "eval_wer": 0.32874010120357927, + "step": 60000 + }, + { + "epoch": 8.87, + "learning_rate": 5.583086053412463e-06, + "loss": 0.9928, + "step": 60040 + }, + { + "epoch": 8.87, + "eval_loss": 0.9106556177139282, + "eval_runtime": 520.9759, + "eval_samples_per_second": 14.663, + "eval_wer": 0.32985505589067726, + "step": 60040 + }, + { + "epoch": 8.88, + "learning_rate": 5.580118694362018e-06, + "loss": 0.9858, + "step": 60080 + }, + { + "epoch": 8.88, + "eval_loss": 0.8965376615524292, + "eval_runtime": 520.7241, + "eval_samples_per_second": 14.67, + "eval_wer": 0.3287972783670202, + "step": 60080 + }, + { + "epoch": 8.89, + "learning_rate": 5.577151335311573e-06, + "loss": 0.9156, + "step": 60120 + }, + { + "epoch": 8.89, + "eval_loss": 0.9081794619560242, + "eval_runtime": 519.7944, + "eval_samples_per_second": 14.696, + "eval_wer": 0.3295405814917522, + "step": 60120 + }, + { + "epoch": 8.89, + "learning_rate": 5.574183976261129e-06, + "loss": 0.9879, + "step": 60160 + }, + { + "epoch": 8.89, + "eval_loss": 0.9024932980537415, + "eval_runtime": 521.9198, + "eval_samples_per_second": 14.636, + "eval_wer": 0.32956917007347264, + "step": 60160 + }, + { + "epoch": 8.9, + "learning_rate": 5.571216617210683e-06, + "loss": 1.0866, + "step": 60200 + }, + { + "epoch": 8.9, + "eval_loss": 0.8938391804695129, + "eval_runtime": 521.6275, + "eval_samples_per_second": 14.645, + "eval_wer": 0.32942622716487036, + "step": 60200 + }, + { + "epoch": 8.9, + "learning_rate": 5.5682492581602375e-06, + "loss": 0.9349, + "step": 60240 + }, + { + "epoch": 8.9, + "eval_loss": 0.9137777090072632, + "eval_runtime": 520.0896, + "eval_samples_per_second": 14.688, + "eval_wer": 0.33045541610680695, + "step": 60240 + }, + { + "epoch": 8.91, + "learning_rate": 5.565281899109792e-06, + "loss": 1.0244, + "step": 60280 + }, + { + "epoch": 8.91, + "eval_loss": 0.8982388377189636, + "eval_runtime": 519.6431, + "eval_samples_per_second": 14.7, + "eval_wer": 0.3291975185111067, + "step": 60280 + }, + { + "epoch": 8.92, + "learning_rate": 5.562314540059348e-06, + "loss": 0.9629, + "step": 60320 + }, + { + "epoch": 8.92, + "eval_loss": 0.9411712884902954, + "eval_runtime": 520.2191, + "eval_samples_per_second": 14.684, + "eval_wer": 0.3335429829326167, + "step": 60320 + }, + { + "epoch": 8.92, + "learning_rate": 5.5593471810089025e-06, + "loss": 0.9403, + "step": 60360 + }, + { + "epoch": 8.92, + "eval_loss": 0.912858247756958, + "eval_runtime": 522.3781, + "eval_samples_per_second": 14.624, + "eval_wer": 0.3301409417078819, + "step": 60360 + }, + { + "epoch": 8.93, + "learning_rate": 5.556379821958458e-06, + "loss": 1.0085, + "step": 60400 + }, + { + "epoch": 8.93, + "eval_loss": 0.9047226309776306, + "eval_runtime": 521.6863, + "eval_samples_per_second": 14.643, + "eval_wer": 0.3302267074530433, + "step": 60400 + }, + { + "epoch": 8.93, + "learning_rate": 5.553412462908012e-06, + "loss": 1.0173, + "step": 60440 + }, + { + "epoch": 8.93, + "eval_loss": 0.8612624406814575, + "eval_runtime": 520.75, + "eval_samples_per_second": 14.669, + "eval_wer": 0.3260241859401355, + "step": 60440 + }, + { + "epoch": 8.94, + "learning_rate": 5.550445103857567e-06, + "loss": 0.9828, + "step": 60480 + }, + { + "epoch": 8.94, + "eval_loss": 0.8574054837226868, + "eval_runtime": 520.4035, + "eval_samples_per_second": 14.679, + "eval_wer": 0.32568112295949, + "step": 60480 + }, + { + "epoch": 8.95, + "learning_rate": 5.547477744807123e-06, + "loss": 0.9269, + "step": 60520 + }, + { + "epoch": 8.95, + "eval_loss": 0.8913673758506775, + "eval_runtime": 520.2768, + "eval_samples_per_second": 14.683, + "eval_wer": 0.32856856971325654, + "step": 60520 + }, + { + "epoch": 8.95, + "learning_rate": 5.544510385756677e-06, + "loss": 0.9868, + "step": 60560 + }, + { + "epoch": 8.95, + "eval_loss": 0.8929964303970337, + "eval_runtime": 521.8046, + "eval_samples_per_second": 14.64, + "eval_wer": 0.32796820949712685, + "step": 60560 + }, + { + "epoch": 8.96, + "learning_rate": 5.541543026706232e-06, + "loss": 1.0992, + "step": 60600 + }, + { + "epoch": 8.96, + "eval_loss": 0.8498595356941223, + "eval_runtime": 521.9137, + "eval_samples_per_second": 14.637, + "eval_wer": 0.32488064267131705, + "step": 60600 + }, + { + "epoch": 8.96, + "learning_rate": 5.538575667655787e-06, + "loss": 0.9399, + "step": 60640 + }, + { + "epoch": 8.96, + "eval_loss": 0.8748541474342346, + "eval_runtime": 526.3293, + "eval_samples_per_second": 14.514, + "eval_wer": 0.326052774521856, + "step": 60640 + }, + { + "epoch": 8.97, + "learning_rate": 5.5356083086053415e-06, + "loss": 1.0001, + "step": 60680 + }, + { + "epoch": 8.97, + "eval_loss": 0.8965076208114624, + "eval_runtime": 521.2526, + "eval_samples_per_second": 14.655, + "eval_wer": 0.32759655793476083, + "step": 60680 + }, + { + "epoch": 8.98, + "learning_rate": 5.532640949554896e-06, + "loss": 0.9923, + "step": 60720 + }, + { + "epoch": 8.98, + "eval_loss": 0.8646832704544067, + "eval_runtime": 524.0144, + "eval_samples_per_second": 14.578, + "eval_wer": 0.3258812430315332, + "step": 60720 + }, + { + "epoch": 8.98, + "learning_rate": 5.529673590504452e-06, + "loss": 0.9833, + "step": 60760 + }, + { + "epoch": 8.98, + "eval_loss": 0.8755890727043152, + "eval_runtime": 522.5819, + "eval_samples_per_second": 14.618, + "eval_wer": 0.32642442608422195, + "step": 60760 + }, + { + "epoch": 8.99, + "learning_rate": 5.5267062314540065e-06, + "loss": 0.9802, + "step": 60800 + }, + { + "epoch": 8.99, + "eval_loss": 0.9241328835487366, + "eval_runtime": 521.004, + "eval_samples_per_second": 14.662, + "eval_wer": 0.33036965036164556, + "step": 60800 + }, + { + "epoch": 8.99, + "learning_rate": 5.523738872403561e-06, + "loss": 1.0772, + "step": 60840 + }, + { + "epoch": 8.99, + "eval_loss": 0.8718317151069641, + "eval_runtime": 521.7743, + "eval_samples_per_second": 14.64, + "eval_wer": 0.32642442608422195, + "step": 60840 + }, + { + "epoch": 9.0, + "learning_rate": 5.520771513353116e-06, + "loss": 1.0238, + "step": 60880 + }, + { + "epoch": 9.0, + "eval_loss": 0.8889086246490479, + "eval_runtime": 521.7892, + "eval_samples_per_second": 14.64, + "eval_wer": 0.32856856971325654, + "step": 60880 + }, + { + "epoch": 9.01, + "learning_rate": 5.517804154302671e-06, + "loss": 1.0146, + "step": 60920 + }, + { + "epoch": 9.01, + "eval_loss": 0.8723910450935364, + "eval_runtime": 518.9411, + "eval_samples_per_second": 14.72, + "eval_wer": 0.32668172331970613, + "step": 60920 + }, + { + "epoch": 9.01, + "learning_rate": 5.514836795252226e-06, + "loss": 0.9189, + "step": 60960 + }, + { + "epoch": 9.01, + "eval_loss": 0.9072814583778381, + "eval_runtime": 520.7453, + "eval_samples_per_second": 14.669, + "eval_wer": 0.3290259870207839, + "step": 60960 + }, + { + "epoch": 9.02, + "learning_rate": 5.511869436201781e-06, + "loss": 0.9867, + "step": 61000 + }, + { + "epoch": 9.02, + "eval_loss": 0.929558277130127, + "eval_runtime": 521.1986, + "eval_samples_per_second": 14.657, + "eval_wer": 0.33042682752508645, + "step": 61000 + }, + { + "epoch": 9.02, + "learning_rate": 5.508902077151336e-06, + "loss": 0.99, + "step": 61040 + }, + { + "epoch": 9.02, + "eval_loss": 0.8509811162948608, + "eval_runtime": 520.8781, + "eval_samples_per_second": 14.666, + "eval_wer": 0.3242802824551874, + "step": 61040 + }, + { + "epoch": 9.03, + "learning_rate": 5.50593471810089e-06, + "loss": 0.9695, + "step": 61080 + }, + { + "epoch": 9.03, + "eval_loss": 0.8567344546318054, + "eval_runtime": 522.0111, + "eval_samples_per_second": 14.634, + "eval_wer": 0.3250235855799194, + "step": 61080 + }, + { + "epoch": 9.03, + "learning_rate": 5.502967359050445e-06, + "loss": 1.0083, + "step": 61120 + }, + { + "epoch": 9.03, + "eval_loss": 0.867013156414032, + "eval_runtime": 520.9806, + "eval_samples_per_second": 14.663, + "eval_wer": 0.3248520540895966, + "step": 61120 + }, + { + "epoch": 9.04, + "learning_rate": 5.500000000000001e-06, + "loss": 0.9743, + "step": 61160 + }, + { + "epoch": 9.04, + "eval_loss": 0.9137815833091736, + "eval_runtime": 520.1546, + "eval_samples_per_second": 14.686, + "eval_wer": 0.328597158294977, + "step": 61160 + }, + { + "epoch": 9.05, + "learning_rate": 5.497032640949556e-06, + "loss": 0.9267, + "step": 61200 + }, + { + "epoch": 9.05, + "eval_loss": 0.9132623076438904, + "eval_runtime": 520.0272, + "eval_samples_per_second": 14.69, + "eval_wer": 0.3287115126218588, + "step": 61200 + }, + { + "epoch": 9.05, + "learning_rate": 5.4940652818991104e-06, + "loss": 0.9289, + "step": 61240 + }, + { + "epoch": 9.05, + "eval_loss": 0.939371645450592, + "eval_runtime": 520.6709, + "eval_samples_per_second": 14.671, + "eval_wer": 0.33059835901540924, + "step": 61240 + }, + { + "epoch": 9.06, + "learning_rate": 5.491097922848665e-06, + "loss": 0.9271, + "step": 61280 + }, + { + "epoch": 9.06, + "eval_loss": 0.9191766977310181, + "eval_runtime": 520.0239, + "eval_samples_per_second": 14.69, + "eval_wer": 0.328968809857343, + "step": 61280 + }, + { + "epoch": 9.06, + "learning_rate": 5.488130563798219e-06, + "loss": 0.955, + "step": 61320 + }, + { + "epoch": 9.06, + "eval_loss": 0.9158635139465332, + "eval_runtime": 520.4795, + "eval_samples_per_second": 14.677, + "eval_wer": 0.32934046141970896, + "step": 61320 + }, + { + "epoch": 9.07, + "learning_rate": 5.4851632047477755e-06, + "loss": 1.0303, + "step": 61360 + }, + { + "epoch": 9.07, + "eval_loss": 0.8932636380195618, + "eval_runtime": 520.7563, + "eval_samples_per_second": 14.669, + "eval_wer": 0.32805397524228824, + "step": 61360 + }, + { + "epoch": 9.08, + "learning_rate": 5.48219584569733e-06, + "loss": 0.9348, + "step": 61400 + }, + { + "epoch": 9.08, + "eval_loss": 0.9475846886634827, + "eval_runtime": 521.4068, + "eval_samples_per_second": 14.651, + "eval_wer": 0.3316847251207868, + "step": 61400 + }, + { + "epoch": 9.08, + "learning_rate": 5.479228486646885e-06, + "loss": 1.0098, + "step": 61440 + }, + { + "epoch": 9.08, + "eval_loss": 0.8940609693527222, + "eval_runtime": 521.1693, + "eval_samples_per_second": 14.657, + "eval_wer": 0.32805397524228824, + "step": 61440 + }, + { + "epoch": 9.09, + "learning_rate": 5.47626112759644e-06, + "loss": 0.9229, + "step": 61480 + }, + { + "epoch": 9.09, + "eval_loss": 0.9015146493911743, + "eval_runtime": 522.5612, + "eval_samples_per_second": 14.618, + "eval_wer": 0.3283684496412133, + "step": 61480 + }, + { + "epoch": 9.09, + "learning_rate": 5.473293768545994e-06, + "loss": 0.9515, + "step": 61520 + }, + { + "epoch": 9.09, + "eval_loss": 0.9430288672447205, + "eval_runtime": 521.5053, + "eval_samples_per_second": 14.648, + "eval_wer": 0.3317704908659481, + "step": 61520 + }, + { + "epoch": 9.1, + "learning_rate": 5.47032640949555e-06, + "loss": 1.0288, + "step": 61560 + }, + { + "epoch": 9.1, + "eval_loss": 0.893963634967804, + "eval_runtime": 520.1132, + "eval_samples_per_second": 14.687, + "eval_wer": 0.3279110323336859, + "step": 61560 + }, + { + "epoch": 9.11, + "learning_rate": 5.467359050445105e-06, + "loss": 0.9751, + "step": 61600 + }, + { + "epoch": 9.11, + "eval_loss": 0.910978376865387, + "eval_runtime": 521.0275, + "eval_samples_per_second": 14.661, + "eval_wer": 0.3287972783670202, + "step": 61600 + }, + { + "epoch": 9.11, + "learning_rate": 5.464391691394659e-06, + "loss": 0.9702, + "step": 61640 + }, + { + "epoch": 9.11, + "eval_loss": 0.8712512254714966, + "eval_runtime": 521.994, + "eval_samples_per_second": 14.634, + "eval_wer": 0.32585265444981276, + "step": 61640 + }, + { + "epoch": 9.12, + "learning_rate": 5.461424332344214e-06, + "loss": 0.9641, + "step": 61680 + }, + { + "epoch": 9.12, + "eval_loss": 0.9221763014793396, + "eval_runtime": 521.528, + "eval_samples_per_second": 14.647, + "eval_wer": 0.32899739843906345, + "step": 61680 + }, + { + "epoch": 9.12, + "learning_rate": 5.458456973293769e-06, + "loss": 1.0054, + "step": 61720 + }, + { + "epoch": 9.12, + "eval_loss": 0.8714380264282227, + "eval_runtime": 520.8777, + "eval_samples_per_second": 14.666, + "eval_wer": 0.32530947139712396, + "step": 61720 + }, + { + "epoch": 9.13, + "learning_rate": 5.455489614243323e-06, + "loss": 1.0149, + "step": 61760 + }, + { + "epoch": 9.13, + "eval_loss": 0.88200843334198, + "eval_runtime": 521.2415, + "eval_samples_per_second": 14.655, + "eval_wer": 0.3265673689928243, + "step": 61760 + }, + { + "epoch": 9.14, + "learning_rate": 5.452522255192879e-06, + "loss": 0.9987, + "step": 61800 + }, + { + "epoch": 9.14, + "eval_loss": 0.8826965689659119, + "eval_runtime": 521.9692, + "eval_samples_per_second": 14.635, + "eval_wer": 0.326052774521856, + "step": 61800 + }, + { + "epoch": 9.14, + "learning_rate": 5.449554896142434e-06, + "loss": 0.9887, + "step": 61840 + }, + { + "epoch": 9.14, + "eval_loss": 0.897479236125946, + "eval_runtime": 522.197, + "eval_samples_per_second": 14.629, + "eval_wer": 0.3272534949541153, + "step": 61840 + }, + { + "epoch": 9.15, + "learning_rate": 5.446587537091988e-06, + "loss": 0.9869, + "step": 61880 + }, + { + "epoch": 9.15, + "eval_loss": 0.9168394804000854, + "eval_runtime": 523.6635, + "eval_samples_per_second": 14.588, + "eval_wer": 0.3287972783670202, + "step": 61880 + }, + { + "epoch": 9.15, + "learning_rate": 5.4436201780415436e-06, + "loss": 0.9072, + "step": 61920 + }, + { + "epoch": 9.15, + "eval_loss": 0.9074807167053223, + "eval_runtime": 521.8051, + "eval_samples_per_second": 14.64, + "eval_wer": 0.32745361502615855, + "step": 61920 + }, + { + "epoch": 9.16, + "learning_rate": 5.440652818991098e-06, + "loss": 1.01, + "step": 61960 + }, + { + "epoch": 9.16, + "eval_loss": 0.8701136112213135, + "eval_runtime": 522.2494, + "eval_samples_per_second": 14.627, + "eval_wer": 0.32548100288744675, + "step": 61960 + }, + { + "epoch": 9.16, + "learning_rate": 5.437685459940653e-06, + "loss": 0.9646, + "step": 62000 + }, + { + "epoch": 9.16, + "eval_loss": 0.906278133392334, + "eval_runtime": 523.7522, + "eval_samples_per_second": 14.585, + "eval_wer": 0.3274250264444381, + "step": 62000 + }, + { + "epoch": 9.17, + "learning_rate": 5.434718100890209e-06, + "loss": 0.9518, + "step": 62040 + }, + { + "epoch": 9.17, + "eval_loss": 0.9330311417579651, + "eval_runtime": 526.7902, + "eval_samples_per_second": 14.501, + "eval_wer": 0.32976929014551587, + "step": 62040 + }, + { + "epoch": 9.18, + "learning_rate": 5.431750741839763e-06, + "loss": 0.982, + "step": 62080 + }, + { + "epoch": 9.18, + "eval_loss": 0.9016255736351013, + "eval_runtime": 526.782, + "eval_samples_per_second": 14.501, + "eval_wer": 0.32708196346379254, + "step": 62080 + }, + { + "epoch": 9.18, + "learning_rate": 5.4287833827893175e-06, + "loss": 0.9341, + "step": 62120 + }, + { + "epoch": 9.18, + "eval_loss": 0.93901127576828, + "eval_runtime": 524.6347, + "eval_samples_per_second": 14.561, + "eval_wer": 0.3296835244003545, + "step": 62120 + }, + { + "epoch": 9.19, + "learning_rate": 5.425816023738873e-06, + "loss": 0.9076, + "step": 62160 + }, + { + "epoch": 9.19, + "eval_loss": 0.9232743382453918, + "eval_runtime": 521.6529, + "eval_samples_per_second": 14.644, + "eval_wer": 0.32905457560250434, + "step": 62160 + }, + { + "epoch": 9.19, + "learning_rate": 5.422848664688428e-06, + "loss": 0.9411, + "step": 62200 + }, + { + "epoch": 9.19, + "eval_loss": 0.9490613341331482, + "eval_runtime": 523.0499, + "eval_samples_per_second": 14.605, + "eval_wer": 0.3313702507218617, + "step": 62200 + }, + { + "epoch": 9.2, + "learning_rate": 5.4198813056379825e-06, + "loss": 0.9697, + "step": 62240 + }, + { + "epoch": 9.2, + "eval_loss": 0.9218747615814209, + "eval_runtime": 522.7853, + "eval_samples_per_second": 14.612, + "eval_wer": 0.3293118728379885, + "step": 62240 + }, + { + "epoch": 9.21, + "learning_rate": 5.416913946587538e-06, + "loss": 0.9666, + "step": 62280 + }, + { + "epoch": 9.21, + "eval_loss": 0.9257290959358215, + "eval_runtime": 525.9524, + "eval_samples_per_second": 14.524, + "eval_wer": 0.3288830441121816, + "step": 62280 + }, + { + "epoch": 9.21, + "learning_rate": 5.413946587537092e-06, + "loss": 0.9073, + "step": 62320 + }, + { + "epoch": 9.21, + "eval_loss": 0.9206984043121338, + "eval_runtime": 524.043, + "eval_samples_per_second": 14.577, + "eval_wer": 0.3281683295691701, + "step": 62320 + }, + { + "epoch": 9.22, + "learning_rate": 5.410979228486647e-06, + "loss": 0.9981, + "step": 62360 + }, + { + "epoch": 9.22, + "eval_loss": 0.910703182220459, + "eval_runtime": 525.1849, + "eval_samples_per_second": 14.545, + "eval_wer": 0.3275107921895995, + "step": 62360 + }, + { + "epoch": 9.22, + "learning_rate": 5.408011869436203e-06, + "loss": 1.0432, + "step": 62400 + }, + { + "epoch": 9.22, + "eval_loss": 0.901178777217865, + "eval_runtime": 524.011, + "eval_samples_per_second": 14.578, + "eval_wer": 0.32759655793476083, + "step": 62400 + }, + { + "epoch": 9.23, + "learning_rate": 5.405044510385757e-06, + "loss": 1.0066, + "step": 62440 + }, + { + "epoch": 9.23, + "eval_loss": 0.9250192642211914, + "eval_runtime": 525.202, + "eval_samples_per_second": 14.545, + "eval_wer": 0.3292261070928271, + "step": 62440 + }, + { + "epoch": 9.24, + "learning_rate": 5.402077151335312e-06, + "loss": 1.0367, + "step": 62480 + }, + { + "epoch": 9.24, + "eval_loss": 0.89219069480896, + "eval_runtime": 525.7372, + "eval_samples_per_second": 14.53, + "eval_wer": 0.3272534949541153, + "step": 62480 + }, + { + "epoch": 9.24, + "learning_rate": 5.399109792284867e-06, + "loss": 1.001, + "step": 62520 + }, + { + "epoch": 9.24, + "eval_loss": 0.8632076978683472, + "eval_runtime": 525.3439, + "eval_samples_per_second": 14.541, + "eval_wer": 0.32482346550787616, + "step": 62520 + }, + { + "epoch": 9.25, + "learning_rate": 5.396142433234421e-06, + "loss": 0.9918, + "step": 62560 + }, + { + "epoch": 9.25, + "eval_loss": 0.9203102588653564, + "eval_runtime": 524.6203, + "eval_samples_per_second": 14.561, + "eval_wer": 0.3287115126218588, + "step": 62560 + }, + { + "epoch": 9.25, + "learning_rate": 5.3931750741839776e-06, + "loss": 1.0215, + "step": 62600 + }, + { + "epoch": 9.25, + "eval_loss": 0.8672576546669006, + "eval_runtime": 525.093, + "eval_samples_per_second": 14.548, + "eval_wer": 0.3256239457960491, + "step": 62600 + }, + { + "epoch": 9.26, + "learning_rate": 5.390207715133532e-06, + "loss": 0.9991, + "step": 62640 + }, + { + "epoch": 9.26, + "eval_loss": 0.8709724545478821, + "eval_runtime": 522.5337, + "eval_samples_per_second": 14.619, + "eval_wer": 0.32636724892078106, + "step": 62640 + }, + { + "epoch": 9.27, + "learning_rate": 5.3872403560830864e-06, + "loss": 1.1186, + "step": 62680 + }, + { + "epoch": 9.27, + "eval_loss": 0.8482937812805176, + "eval_runtime": 521.0002, + "eval_samples_per_second": 14.662, + "eval_wer": 0.3244232253637897, + "step": 62680 + }, + { + "epoch": 9.27, + "learning_rate": 5.384272997032641e-06, + "loss": 1.0169, + "step": 62720 + }, + { + "epoch": 9.27, + "eval_loss": 0.8774898052215576, + "eval_runtime": 520.8077, + "eval_samples_per_second": 14.668, + "eval_wer": 0.32613854026701733, + "step": 62720 + }, + { + "epoch": 9.28, + "learning_rate": 5.381305637982196e-06, + "loss": 0.9136, + "step": 62760 + }, + { + "epoch": 9.28, + "eval_loss": 0.8759512305259705, + "eval_runtime": 520.5315, + "eval_samples_per_second": 14.675, + "eval_wer": 0.3257097115412104, + "step": 62760 + }, + { + "epoch": 9.28, + "learning_rate": 5.378338278931751e-06, + "loss": 0.8875, + "step": 62800 + }, + { + "epoch": 9.28, + "eval_loss": 0.9390785694122314, + "eval_runtime": 521.094, + "eval_samples_per_second": 14.66, + "eval_wer": 0.3297407015637954, + "step": 62800 + }, + { + "epoch": 9.29, + "learning_rate": 5.375370919881307e-06, + "loss": 0.9978, + "step": 62840 + }, + { + "epoch": 9.29, + "eval_loss": 0.8889870047569275, + "eval_runtime": 521.2433, + "eval_samples_per_second": 14.655, + "eval_wer": 0.3270533748820721, + "step": 62840 + }, + { + "epoch": 9.29, + "learning_rate": 5.372403560830861e-06, + "loss": 0.9811, + "step": 62880 + }, + { + "epoch": 9.29, + "eval_loss": 0.8811739683151245, + "eval_runtime": 520.39, + "eval_samples_per_second": 14.679, + "eval_wer": 0.326738900483147, + "step": 62880 + }, + { + "epoch": 9.3, + "learning_rate": 5.369436201780416e-06, + "loss": 1.0129, + "step": 62920 + }, + { + "epoch": 9.3, + "eval_loss": 0.8766217827796936, + "eval_runtime": 519.6404, + "eval_samples_per_second": 14.701, + "eval_wer": 0.3264816032476629, + "step": 62920 + }, + { + "epoch": 9.31, + "learning_rate": 5.36646884272997e-06, + "loss": 0.9447, + "step": 62960 + }, + { + "epoch": 9.31, + "eval_loss": 0.9186463952064514, + "eval_runtime": 521.2816, + "eval_samples_per_second": 14.654, + "eval_wer": 0.3282540953143315, + "step": 62960 + }, + { + "epoch": 9.31, + "learning_rate": 5.363501483679525e-06, + "loss": 0.9757, + "step": 63000 + }, + { + "epoch": 9.31, + "eval_loss": 0.8648829460144043, + "eval_runtime": 521.9464, + "eval_samples_per_second": 14.636, + "eval_wer": 0.32490923125303756, + "step": 63000 + }, + { + "epoch": 9.32, + "learning_rate": 5.360534124629081e-06, + "loss": 1.0058, + "step": 63040 + }, + { + "epoch": 9.32, + "eval_loss": 0.8797416687011719, + "eval_runtime": 524.691, + "eval_samples_per_second": 14.559, + "eval_wer": 0.32668172331970613, + "step": 63040 + }, + { + "epoch": 9.32, + "learning_rate": 5.357566765578636e-06, + "loss": 0.902, + "step": 63080 + }, + { + "epoch": 9.32, + "eval_loss": 0.890945315361023, + "eval_runtime": 520.7206, + "eval_samples_per_second": 14.67, + "eval_wer": 0.32796820949712685, + "step": 63080 + }, + { + "epoch": 9.33, + "learning_rate": 5.35459940652819e-06, + "loss": 0.9287, + "step": 63120 + }, + { + "epoch": 9.33, + "eval_loss": 0.9338799118995667, + "eval_runtime": 522.6954, + "eval_samples_per_second": 14.615, + "eval_wer": 0.33145601646702305, + "step": 63120 + }, + { + "epoch": 9.34, + "learning_rate": 5.351632047477745e-06, + "loss": 0.9447, + "step": 63160 + }, + { + "epoch": 9.34, + "eval_loss": 0.8940207362174988, + "eval_runtime": 522.8312, + "eval_samples_per_second": 14.611, + "eval_wer": 0.32796820949712685, + "step": 63160 + }, + { + "epoch": 9.34, + "learning_rate": 5.348664688427299e-06, + "loss": 1.0104, + "step": 63200 + }, + { + "epoch": 9.34, + "eval_loss": 0.8592666387557983, + "eval_runtime": 521.743, + "eval_samples_per_second": 14.641, + "eval_wer": 0.3250235855799194, + "step": 63200 + }, + { + "epoch": 9.35, + "learning_rate": 5.345697329376855e-06, + "loss": 0.9282, + "step": 63240 + }, + { + "epoch": 9.35, + "eval_loss": 0.9148645401000977, + "eval_runtime": 523.7757, + "eval_samples_per_second": 14.584, + "eval_wer": 0.328968809857343, + "step": 63240 + }, + { + "epoch": 9.35, + "learning_rate": 5.34272997032641e-06, + "loss": 1.0496, + "step": 63280 + }, + { + "epoch": 9.35, + "eval_loss": 0.9117149710655212, + "eval_runtime": 520.2403, + "eval_samples_per_second": 14.684, + "eval_wer": 0.32853998113153604, + "step": 63280 + }, + { + "epoch": 9.36, + "learning_rate": 5.339762611275965e-06, + "loss": 0.9584, + "step": 63320 + }, + { + "epoch": 9.36, + "eval_loss": 0.8774061799049377, + "eval_runtime": 521.5113, + "eval_samples_per_second": 14.648, + "eval_wer": 0.32651019182938334, + "step": 63320 + }, + { + "epoch": 9.37, + "learning_rate": 5.3367952522255196e-06, + "loss": 0.9567, + "step": 63360 + }, + { + "epoch": 9.37, + "eval_loss": 0.9026126861572266, + "eval_runtime": 521.1637, + "eval_samples_per_second": 14.658, + "eval_wer": 0.327853855170245, + "step": 63360 + }, + { + "epoch": 9.37, + "learning_rate": 5.333827893175074e-06, + "loss": 0.9695, + "step": 63400 + }, + { + "epoch": 9.37, + "eval_loss": 0.9164305925369263, + "eval_runtime": 522.1853, + "eval_samples_per_second": 14.629, + "eval_wer": 0.32951199291003175, + "step": 63400 + }, + { + "epoch": 9.38, + "learning_rate": 5.33086053412463e-06, + "loss": 0.9978, + "step": 63440 + }, + { + "epoch": 9.38, + "eval_loss": 0.8856332898139954, + "eval_runtime": 521.8398, + "eval_samples_per_second": 14.639, + "eval_wer": 0.32688184339174936, + "step": 63440 + }, + { + "epoch": 9.38, + "learning_rate": 5.327893175074185e-06, + "loss": 0.9788, + "step": 63480 + }, + { + "epoch": 9.38, + "eval_loss": 0.9038870334625244, + "eval_runtime": 522.2365, + "eval_samples_per_second": 14.627, + "eval_wer": 0.32779667800680407, + "step": 63480 + }, + { + "epoch": 9.39, + "learning_rate": 5.324925816023739e-06, + "loss": 0.9346, + "step": 63520 + }, + { + "epoch": 9.39, + "eval_loss": 0.930433988571167, + "eval_runtime": 527.653, + "eval_samples_per_second": 14.477, + "eval_wer": 0.32956917007347264, + "step": 63520 + }, + { + "epoch": 9.4, + "learning_rate": 5.321958456973294e-06, + "loss": 1.0508, + "step": 63560 + }, + { + "epoch": 9.4, + "eval_loss": 0.8858340978622437, + "eval_runtime": 520.8648, + "eval_samples_per_second": 14.666, + "eval_wer": 0.3266245461562652, + "step": 63560 + }, + { + "epoch": 9.4, + "learning_rate": 5.318991097922849e-06, + "loss": 0.9768, + "step": 63600 + }, + { + "epoch": 9.4, + "eval_loss": 0.9302107691764832, + "eval_runtime": 521.0888, + "eval_samples_per_second": 14.66, + "eval_wer": 0.32985505589067726, + "step": 63600 + }, + { + "epoch": 9.41, + "learning_rate": 5.316023738872405e-06, + "loss": 0.8673, + "step": 63640 + }, + { + "epoch": 9.41, + "eval_loss": 0.9720991253852844, + "eval_runtime": 521.2821, + "eval_samples_per_second": 14.654, + "eval_wer": 0.3325995597358415, + "step": 63640 + }, + { + "epoch": 9.41, + "learning_rate": 5.313056379821959e-06, + "loss": 0.9993, + "step": 63680 + }, + { + "epoch": 9.41, + "eval_loss": 0.9731243848800659, + "eval_runtime": 521.9256, + "eval_samples_per_second": 14.636, + "eval_wer": 0.33334286286057346, + "step": 63680 + }, + { + "epoch": 9.42, + "learning_rate": 5.310089020771514e-06, + "loss": 1.035, + "step": 63720 + }, + { + "epoch": 9.42, + "eval_loss": 0.8896510004997253, + "eval_runtime": 519.6811, + "eval_samples_per_second": 14.699, + "eval_wer": 0.3275679693530404, + "step": 63720 + }, + { + "epoch": 9.42, + "learning_rate": 5.307121661721068e-06, + "loss": 1.0397, + "step": 63760 + }, + { + "epoch": 9.42, + "eval_loss": 0.8909620046615601, + "eval_runtime": 522.2854, + "eval_samples_per_second": 14.626, + "eval_wer": 0.3269961977186312, + "step": 63760 + }, + { + "epoch": 9.43, + "learning_rate": 5.3041543026706235e-06, + "loss": 0.9421, + "step": 63800 + }, + { + "epoch": 9.43, + "eval_loss": 0.8983649015426636, + "eval_runtime": 520.6856, + "eval_samples_per_second": 14.671, + "eval_wer": 0.32848280396809515, + "step": 63800 + }, + { + "epoch": 9.44, + "learning_rate": 5.301186943620178e-06, + "loss": 0.9547, + "step": 63840 + }, + { + "epoch": 9.44, + "eval_loss": 0.8870012760162354, + "eval_runtime": 520.4979, + "eval_samples_per_second": 14.676, + "eval_wer": 0.32782526658852457, + "step": 63840 + }, + { + "epoch": 9.44, + "learning_rate": 5.298219584569734e-06, + "loss": 1.0335, + "step": 63880 + }, + { + "epoch": 9.44, + "eval_loss": 0.8790306448936462, + "eval_runtime": 520.1698, + "eval_samples_per_second": 14.686, + "eval_wer": 0.3271391406272335, + "step": 63880 + }, + { + "epoch": 9.45, + "learning_rate": 5.2952522255192885e-06, + "loss": 0.973, + "step": 63920 + }, + { + "epoch": 9.45, + "eval_loss": 0.9126614928245544, + "eval_runtime": 521.2591, + "eval_samples_per_second": 14.655, + "eval_wer": 0.3296835244003545, + "step": 63920 + }, + { + "epoch": 9.45, + "learning_rate": 5.292284866468843e-06, + "loss": 0.916, + "step": 63960 + }, + { + "epoch": 9.45, + "eval_loss": 0.9147560000419617, + "eval_runtime": 519.9566, + "eval_samples_per_second": 14.692, + "eval_wer": 0.3295405814917522, + "step": 63960 + }, + { + "epoch": 9.46, + "learning_rate": 5.2893175074183974e-06, + "loss": 0.9699, + "step": 64000 + }, + { + "epoch": 9.46, + "eval_loss": 0.9218246340751648, + "eval_runtime": 521.0774, + "eval_samples_per_second": 14.66, + "eval_wer": 0.3298836444723977, + "step": 64000 + }, + { + "epoch": 9.47, + "learning_rate": 5.286350148367953e-06, + "loss": 0.9648, + "step": 64040 + }, + { + "epoch": 9.47, + "eval_loss": 0.9000306129455566, + "eval_runtime": 520.8242, + "eval_samples_per_second": 14.667, + "eval_wer": 0.32782526658852457, + "step": 64040 + }, + { + "epoch": 9.47, + "learning_rate": 5.283382789317508e-06, + "loss": 0.9997, + "step": 64080 + }, + { + "epoch": 9.47, + "eval_loss": 0.9146038889884949, + "eval_runtime": 521.7171, + "eval_samples_per_second": 14.642, + "eval_wer": 0.32891163269390206, + "step": 64080 + }, + { + "epoch": 9.48, + "learning_rate": 5.280415430267063e-06, + "loss": 1.0384, + "step": 64120 + }, + { + "epoch": 9.48, + "eval_loss": 0.9392070174217224, + "eval_runtime": 520.9797, + "eval_samples_per_second": 14.663, + "eval_wer": 0.3309985991594957, + "step": 64120 + }, + { + "epoch": 9.48, + "learning_rate": 5.277448071216618e-06, + "loss": 0.9187, + "step": 64160 + }, + { + "epoch": 9.48, + "eval_loss": 0.9069005250930786, + "eval_runtime": 520.5167, + "eval_samples_per_second": 14.676, + "eval_wer": 0.32942622716487036, + "step": 64160 + }, + { + "epoch": 9.49, + "learning_rate": 5.274480712166172e-06, + "loss": 0.9569, + "step": 64200 + }, + { + "epoch": 9.49, + "eval_loss": 0.9210803508758545, + "eval_runtime": 521.058, + "eval_samples_per_second": 14.661, + "eval_wer": 0.3310843649046571, + "step": 64200 + }, + { + "epoch": 9.5, + "learning_rate": 5.271513353115727e-06, + "loss": 1.0001, + "step": 64240 + }, + { + "epoch": 9.5, + "eval_loss": 0.8720433115959167, + "eval_runtime": 521.2045, + "eval_samples_per_second": 14.656, + "eval_wer": 0.3260241859401355, + "step": 64240 + }, + { + "epoch": 9.5, + "learning_rate": 5.268545994065283e-06, + "loss": 1.0305, + "step": 64280 + }, + { + "epoch": 9.5, + "eval_loss": 0.9021037817001343, + "eval_runtime": 519.4996, + "eval_samples_per_second": 14.705, + "eval_wer": 0.3300551759627205, + "step": 64280 + }, + { + "epoch": 9.51, + "learning_rate": 5.265578635014837e-06, + "loss": 0.893, + "step": 64320 + }, + { + "epoch": 9.51, + "eval_loss": 0.8933009505271912, + "eval_runtime": 520.0573, + "eval_samples_per_second": 14.689, + "eval_wer": 0.32796820949712685, + "step": 64320 + }, + { + "epoch": 9.51, + "learning_rate": 5.2626112759643925e-06, + "loss": 0.9715, + "step": 64360 + }, + { + "epoch": 9.51, + "eval_loss": 0.8452712893486023, + "eval_runtime": 520.3627, + "eval_samples_per_second": 14.68, + "eval_wer": 0.32410875096486463, + "step": 64360 + }, + { + "epoch": 9.52, + "learning_rate": 5.259643916913947e-06, + "loss": 1.0749, + "step": 64400 + }, + { + "epoch": 9.52, + "eval_loss": 0.911861002445221, + "eval_runtime": 522.3127, + "eval_samples_per_second": 14.625, + "eval_wer": 0.3294548157465908, + "step": 64400 + }, + { + "epoch": 9.53, + "learning_rate": 5.256676557863501e-06, + "loss": 1.0358, + "step": 64440 + }, + { + "epoch": 9.53, + "eval_loss": 0.888854444026947, + "eval_runtime": 519.8825, + "eval_samples_per_second": 14.694, + "eval_wer": 0.32759655793476083, + "step": 64440 + }, + { + "epoch": 9.53, + "learning_rate": 5.2537091988130575e-06, + "loss": 0.9841, + "step": 64480 + }, + { + "epoch": 9.53, + "eval_loss": 0.84819495677948, + "eval_runtime": 521.2455, + "eval_samples_per_second": 14.655, + "eval_wer": 0.324566168272392, + "step": 64480 + }, + { + "epoch": 9.54, + "learning_rate": 5.250741839762612e-06, + "loss": 1.0052, + "step": 64520 + }, + { + "epoch": 9.54, + "eval_loss": 0.8873188495635986, + "eval_runtime": 521.8439, + "eval_samples_per_second": 14.638, + "eval_wer": 0.3279396209154064, + "step": 64520 + }, + { + "epoch": 9.54, + "learning_rate": 5.247774480712166e-06, + "loss": 0.9726, + "step": 64560 + }, + { + "epoch": 9.54, + "eval_loss": 0.868062436580658, + "eval_runtime": 520.4316, + "eval_samples_per_second": 14.678, + "eval_wer": 0.32688184339174936, + "step": 64560 + }, + { + "epoch": 9.55, + "learning_rate": 5.244807121661722e-06, + "loss": 0.9364, + "step": 64600 + }, + { + "epoch": 9.55, + "eval_loss": 0.934567928314209, + "eval_runtime": 521.7763, + "eval_samples_per_second": 14.64, + "eval_wer": 0.33139883930358216, + "step": 64600 + }, + { + "epoch": 9.55, + "learning_rate": 5.241839762611276e-06, + "loss": 1.0294, + "step": 64640 + }, + { + "epoch": 9.55, + "eval_loss": 0.9039771556854248, + "eval_runtime": 519.3468, + "eval_samples_per_second": 14.709, + "eval_wer": 0.3293118728379885, + "step": 64640 + }, + { + "epoch": 9.56, + "learning_rate": 5.238872403560831e-06, + "loss": 1.0801, + "step": 64680 + }, + { + "epoch": 9.56, + "eval_loss": 0.9151927828788757, + "eval_runtime": 519.7591, + "eval_samples_per_second": 14.697, + "eval_wer": 0.32994082163583865, + "step": 64680 + }, + { + "epoch": 9.57, + "learning_rate": 5.235905044510387e-06, + "loss": 1.0288, + "step": 64720 + }, + { + "epoch": 9.57, + "eval_loss": 0.8815693855285645, + "eval_runtime": 519.7265, + "eval_samples_per_second": 14.698, + "eval_wer": 0.3279110323336859, + "step": 64720 + }, + { + "epoch": 9.57, + "learning_rate": 5.232937685459941e-06, + "loss": 0.9962, + "step": 64760 + }, + { + "epoch": 9.57, + "eval_loss": 0.8934894800186157, + "eval_runtime": 521.767, + "eval_samples_per_second": 14.641, + "eval_wer": 0.3284256268046542, + "step": 64760 + }, + { + "epoch": 9.58, + "learning_rate": 5.229970326409496e-06, + "loss": 1.0266, + "step": 64800 + }, + { + "epoch": 9.58, + "eval_loss": 0.8994660973548889, + "eval_runtime": 520.2574, + "eval_samples_per_second": 14.683, + "eval_wer": 0.3291975185111067, + "step": 64800 + }, + { + "epoch": 9.58, + "learning_rate": 5.227002967359051e-06, + "loss": 0.974, + "step": 64840 + }, + { + "epoch": 9.58, + "eval_loss": 0.9028300642967224, + "eval_runtime": 521.3141, + "eval_samples_per_second": 14.653, + "eval_wer": 0.32914034134766573, + "step": 64840 + }, + { + "epoch": 9.59, + "learning_rate": 5.224035608308605e-06, + "loss": 0.9539, + "step": 64880 + }, + { + "epoch": 9.59, + "eval_loss": 0.9245048761367798, + "eval_runtime": 522.8037, + "eval_samples_per_second": 14.612, + "eval_wer": 0.3296263472369136, + "step": 64880 + }, + { + "epoch": 9.6, + "learning_rate": 5.2210682492581614e-06, + "loss": 0.9765, + "step": 64920 + }, + { + "epoch": 9.6, + "eval_loss": 0.9380620718002319, + "eval_runtime": 521.0051, + "eval_samples_per_second": 14.662, + "eval_wer": 0.3309985991594957, + "step": 64920 + }, + { + "epoch": 9.6, + "learning_rate": 5.218100890207716e-06, + "loss": 0.9918, + "step": 64960 + }, + { + "epoch": 9.6, + "eval_loss": 0.9069708585739136, + "eval_runtime": 521.0187, + "eval_samples_per_second": 14.662, + "eval_wer": 0.32856856971325654, + "step": 64960 + }, + { + "epoch": 9.61, + "learning_rate": 5.21513353115727e-06, + "loss": 0.9701, + "step": 65000 + }, + { + "epoch": 9.61, + "eval_loss": 0.917822539806366, + "eval_runtime": 522.0475, + "eval_samples_per_second": 14.633, + "eval_wer": 0.32908316418422484, + "step": 65000 + }, + { + "epoch": 9.61, + "learning_rate": 5.212166172106825e-06, + "loss": 0.964, + "step": 65040 + }, + { + "epoch": 9.61, + "eval_loss": 0.8908485770225525, + "eval_runtime": 520.9089, + "eval_samples_per_second": 14.665, + "eval_wer": 0.32702478630035164, + "step": 65040 + }, + { + "epoch": 9.62, + "learning_rate": 5.20919881305638e-06, + "loss": 0.9459, + "step": 65080 + }, + { + "epoch": 9.62, + "eval_loss": 0.9283452033996582, + "eval_runtime": 522.4683, + "eval_samples_per_second": 14.621, + "eval_wer": 0.32905457560250434, + "step": 65080 + }, + { + "epoch": 9.63, + "learning_rate": 5.206231454005935e-06, + "loss": 0.981, + "step": 65120 + }, + { + "epoch": 9.63, + "eval_loss": 0.8879848718643188, + "eval_runtime": 519.042, + "eval_samples_per_second": 14.717, + "eval_wer": 0.3269676091369107, + "step": 65120 + }, + { + "epoch": 9.63, + "learning_rate": 5.203264094955491e-06, + "loss": 0.9447, + "step": 65160 + }, + { + "epoch": 9.63, + "eval_loss": 0.926645040512085, + "eval_runtime": 518.8844, + "eval_samples_per_second": 14.722, + "eval_wer": 0.32925469567454757, + "step": 65160 + }, + { + "epoch": 9.64, + "learning_rate": 5.200296735905045e-06, + "loss": 0.9487, + "step": 65200 + }, + { + "epoch": 9.64, + "eval_loss": 0.9194495677947998, + "eval_runtime": 521.5585, + "eval_samples_per_second": 14.646, + "eval_wer": 0.3284256268046542, + "step": 65200 + }, + { + "epoch": 9.64, + "learning_rate": 5.1973293768545995e-06, + "loss": 0.9704, + "step": 65240 + }, + { + "epoch": 9.64, + "eval_loss": 0.8458552360534668, + "eval_runtime": 521.7181, + "eval_samples_per_second": 14.642, + "eval_wer": 0.32396580805626235, + "step": 65240 + }, + { + "epoch": 9.65, + "learning_rate": 5.194362017804154e-06, + "loss": 0.9568, + "step": 65280 + }, + { + "epoch": 9.65, + "eval_loss": 0.8653109669685364, + "eval_runtime": 520.3753, + "eval_samples_per_second": 14.68, + "eval_wer": 0.32482346550787616, + "step": 65280 + }, + { + "epoch": 9.66, + "learning_rate": 5.19139465875371e-06, + "loss": 0.9167, + "step": 65320 + }, + { + "epoch": 9.66, + "eval_loss": 0.8854416608810425, + "eval_runtime": 521.3796, + "eval_samples_per_second": 14.652, + "eval_wer": 0.326052774521856, + "step": 65320 + }, + { + "epoch": 9.66, + "learning_rate": 5.1884272997032645e-06, + "loss": 0.9727, + "step": 65360 + }, + { + "epoch": 9.66, + "eval_loss": 0.8713550567626953, + "eval_runtime": 521.735, + "eval_samples_per_second": 14.642, + "eval_wer": 0.3253666485605649, + "step": 65360 + }, + { + "epoch": 9.67, + "learning_rate": 5.18545994065282e-06, + "loss": 1.036, + "step": 65400 + }, + { + "epoch": 9.67, + "eval_loss": 0.8529122471809387, + "eval_runtime": 521.8725, + "eval_samples_per_second": 14.638, + "eval_wer": 0.32410875096486463, + "step": 65400 + }, + { + "epoch": 9.67, + "learning_rate": 5.182492581602374e-06, + "loss": 1.0706, + "step": 65440 + }, + { + "epoch": 9.67, + "eval_loss": 0.8716095685958862, + "eval_runtime": 520.6935, + "eval_samples_per_second": 14.671, + "eval_wer": 0.3250807627433603, + "step": 65440 + }, + { + "epoch": 9.68, + "learning_rate": 5.179525222551929e-06, + "loss": 0.994, + "step": 65480 + }, + { + "epoch": 9.68, + "eval_loss": 0.8643802404403687, + "eval_runtime": 520.5585, + "eval_samples_per_second": 14.675, + "eval_wer": 0.3247091111809943, + "step": 65480 + }, + { + "epoch": 9.69, + "learning_rate": 5.176557863501485e-06, + "loss": 0.9199, + "step": 65520 + }, + { + "epoch": 9.69, + "eval_loss": 0.8754771947860718, + "eval_runtime": 521.2987, + "eval_samples_per_second": 14.654, + "eval_wer": 0.32533805997884446, + "step": 65520 + }, + { + "epoch": 9.69, + "learning_rate": 5.173590504451039e-06, + "loss": 0.9807, + "step": 65560 + }, + { + "epoch": 9.69, + "eval_loss": 0.9002275466918945, + "eval_runtime": 519.0576, + "eval_samples_per_second": 14.717, + "eval_wer": 0.32599559735841505, + "step": 65560 + }, + { + "epoch": 9.7, + "learning_rate": 5.170623145400594e-06, + "loss": 0.9425, + "step": 65600 + }, + { + "epoch": 9.7, + "eval_loss": 0.9267570972442627, + "eval_runtime": 521.0609, + "eval_samples_per_second": 14.66, + "eval_wer": 0.32848280396809515, + "step": 65600 + }, + { + "epoch": 9.7, + "learning_rate": 5.167655786350149e-06, + "loss": 1.0029, + "step": 65640 + }, + { + "epoch": 9.7, + "eval_loss": 0.8965702652931213, + "eval_runtime": 520.1691, + "eval_samples_per_second": 14.686, + "eval_wer": 0.3264530146659424, + "step": 65640 + }, + { + "epoch": 9.71, + "learning_rate": 5.1646884272997035e-06, + "loss": 0.9269, + "step": 65680 + }, + { + "epoch": 9.71, + "eval_loss": 0.9374476671218872, + "eval_runtime": 524.4014, + "eval_samples_per_second": 14.567, + "eval_wer": 0.32956917007347264, + "step": 65680 + }, + { + "epoch": 9.71, + "learning_rate": 5.161721068249259e-06, + "loss": 0.9201, + "step": 65720 + }, + { + "epoch": 9.71, + "eval_loss": 0.9041420221328735, + "eval_runtime": 519.4117, + "eval_samples_per_second": 14.707, + "eval_wer": 0.3276823236799222, + "step": 65720 + }, + { + "epoch": 9.72, + "learning_rate": 5.158753709198814e-06, + "loss": 0.9099, + "step": 65760 + }, + { + "epoch": 9.72, + "eval_loss": 0.9010626077651978, + "eval_runtime": 520.5925, + "eval_samples_per_second": 14.674, + "eval_wer": 0.3270533748820721, + "step": 65760 + }, + { + "epoch": 9.73, + "learning_rate": 5.1557863501483685e-06, + "loss": 0.9696, + "step": 65800 + }, + { + "epoch": 9.73, + "eval_loss": 0.8868222236633301, + "eval_runtime": 519.1888, + "eval_samples_per_second": 14.713, + "eval_wer": 0.3253666485605649, + "step": 65800 + }, + { + "epoch": 9.73, + "learning_rate": 5.152818991097923e-06, + "loss": 0.9471, + "step": 65840 + }, + { + "epoch": 9.73, + "eval_loss": 0.9160571694374084, + "eval_runtime": 520.036, + "eval_samples_per_second": 14.689, + "eval_wer": 0.32731067211755627, + "step": 65840 + }, + { + "epoch": 9.74, + "learning_rate": 5.149851632047478e-06, + "loss": 0.9145, + "step": 65880 + }, + { + "epoch": 9.74, + "eval_loss": 0.875485897064209, + "eval_runtime": 519.9988, + "eval_samples_per_second": 14.69, + "eval_wer": 0.3243374596186283, + "step": 65880 + }, + { + "epoch": 9.74, + "learning_rate": 5.146884272997033e-06, + "loss": 0.9752, + "step": 65920 + }, + { + "epoch": 9.74, + "eval_loss": 0.9192938804626465, + "eval_runtime": 519.7851, + "eval_samples_per_second": 14.696, + "eval_wer": 0.3279967980788473, + "step": 65920 + }, + { + "epoch": 9.75, + "learning_rate": 5.143916913946588e-06, + "loss": 1.0071, + "step": 65960 + }, + { + "epoch": 9.75, + "eval_loss": 0.8947373032569885, + "eval_runtime": 521.2527, + "eval_samples_per_second": 14.655, + "eval_wer": 0.32668172331970613, + "step": 65960 + }, + { + "epoch": 9.76, + "learning_rate": 5.140949554896143e-06, + "loss": 0.9202, + "step": 66000 + }, + { + "epoch": 9.76, + "eval_loss": 0.9317971467971802, + "eval_runtime": 520.809, + "eval_samples_per_second": 14.668, + "eval_wer": 0.3293976385831499, + "step": 66000 + }, + { + "epoch": 9.76, + "learning_rate": 5.137982195845698e-06, + "loss": 0.9795, + "step": 66040 + }, + { + "epoch": 9.76, + "eval_loss": 0.8823733925819397, + "eval_runtime": 520.5468, + "eval_samples_per_second": 14.675, + "eval_wer": 0.3255095914691672, + "step": 66040 + }, + { + "epoch": 9.77, + "learning_rate": 5.135014836795252e-06, + "loss": 0.9917, + "step": 66080 + }, + { + "epoch": 9.77, + "eval_loss": 0.9035821557044983, + "eval_runtime": 522.3509, + "eval_samples_per_second": 14.624, + "eval_wer": 0.3269676091369107, + "step": 66080 + }, + { + "epoch": 9.77, + "learning_rate": 5.132047477744807e-06, + "loss": 1.0487, + "step": 66120 + }, + { + "epoch": 9.77, + "eval_loss": 0.8938897252082825, + "eval_runtime": 518.1694, + "eval_samples_per_second": 14.742, + "eval_wer": 0.32608136310357644, + "step": 66120 + }, + { + "epoch": 9.78, + "learning_rate": 5.129080118694363e-06, + "loss": 1.0176, + "step": 66160 + }, + { + "epoch": 9.78, + "eval_loss": 0.8860788941383362, + "eval_runtime": 519.8834, + "eval_samples_per_second": 14.694, + "eval_wer": 0.3254524143057263, + "step": 66160 + }, + { + "epoch": 9.79, + "learning_rate": 5.126112759643917e-06, + "loss": 1.0223, + "step": 66200 + }, + { + "epoch": 9.79, + "eval_loss": 0.8981444835662842, + "eval_runtime": 519.724, + "eval_samples_per_second": 14.698, + "eval_wer": 0.3269676091369107, + "step": 66200 + }, + { + "epoch": 9.79, + "learning_rate": 5.1231454005934724e-06, + "loss": 1.0241, + "step": 66240 + }, + { + "epoch": 9.79, + "eval_loss": 0.8599478006362915, + "eval_runtime": 522.0523, + "eval_samples_per_second": 14.633, + "eval_wer": 0.3235655679121759, + "step": 66240 + }, + { + "epoch": 9.8, + "learning_rate": 5.120178041543027e-06, + "loss": 0.9318, + "step": 66280 + }, + { + "epoch": 9.8, + "eval_loss": 0.8916246891021729, + "eval_runtime": 524.9773, + "eval_samples_per_second": 14.551, + "eval_wer": 0.3260241859401355, + "step": 66280 + }, + { + "epoch": 9.8, + "learning_rate": 5.117210682492581e-06, + "loss": 0.9596, + "step": 66320 + }, + { + "epoch": 9.8, + "eval_loss": 0.8819082975387573, + "eval_runtime": 521.6243, + "eval_samples_per_second": 14.645, + "eval_wer": 0.32533805997884446, + "step": 66320 + }, + { + "epoch": 9.81, + "learning_rate": 5.1142433234421375e-06, + "loss": 0.9446, + "step": 66360 + }, + { + "epoch": 9.81, + "eval_loss": 0.880855917930603, + "eval_runtime": 519.1233, + "eval_samples_per_second": 14.715, + "eval_wer": 0.32530947139712396, + "step": 66360 + }, + { + "epoch": 9.82, + "learning_rate": 5.111275964391692e-06, + "loss": 1.0143, + "step": 66400 + }, + { + "epoch": 9.82, + "eval_loss": 0.9238023161888123, + "eval_runtime": 519.962, + "eval_samples_per_second": 14.691, + "eval_wer": 0.3283684496412133, + "step": 66400 + }, + { + "epoch": 9.82, + "learning_rate": 5.108308605341246e-06, + "loss": 1.0188, + "step": 66440 + }, + { + "epoch": 9.82, + "eval_loss": 0.8921962976455688, + "eval_runtime": 518.7456, + "eval_samples_per_second": 14.726, + "eval_wer": 0.3257383001229309, + "step": 66440 + }, + { + "epoch": 9.83, + "learning_rate": 5.105341246290802e-06, + "loss": 1.0049, + "step": 66480 + }, + { + "epoch": 9.83, + "eval_loss": 0.9202232360839844, + "eval_runtime": 519.738, + "eval_samples_per_second": 14.698, + "eval_wer": 0.32908316418422484, + "step": 66480 + }, + { + "epoch": 9.83, + "learning_rate": 5.102373887240356e-06, + "loss": 0.9496, + "step": 66520 + }, + { + "epoch": 9.83, + "eval_loss": 0.9338187575340271, + "eval_runtime": 519.7874, + "eval_samples_per_second": 14.696, + "eval_wer": 0.3293976385831499, + "step": 66520 + }, + { + "epoch": 9.84, + "learning_rate": 5.099406528189912e-06, + "loss": 0.9074, + "step": 66560 + }, + { + "epoch": 9.84, + "eval_loss": 0.9405819177627563, + "eval_runtime": 521.6088, + "eval_samples_per_second": 14.645, + "eval_wer": 0.3293690500014294, + "step": 66560 + }, + { + "epoch": 9.84, + "learning_rate": 5.096439169139467e-06, + "loss": 0.9166, + "step": 66600 + }, + { + "epoch": 9.84, + "eval_loss": 0.9684476256370544, + "eval_runtime": 520.4367, + "eval_samples_per_second": 14.678, + "eval_wer": 0.3316561365390663, + "step": 66600 + }, + { + "epoch": 9.85, + "learning_rate": 5.093471810089021e-06, + "loss": 0.9439, + "step": 66640 + }, + { + "epoch": 9.85, + "eval_loss": 0.9049162268638611, + "eval_runtime": 525.417, + "eval_samples_per_second": 14.539, + "eval_wer": 0.32659595757454474, + "step": 66640 + }, + { + "epoch": 9.86, + "learning_rate": 5.0905044510385755e-06, + "loss": 0.9587, + "step": 66680 + }, + { + "epoch": 9.86, + "eval_loss": 0.8936130404472351, + "eval_runtime": 521.3215, + "eval_samples_per_second": 14.653, + "eval_wer": 0.32593842019497415, + "step": 66680 + }, + { + "epoch": 9.86, + "learning_rate": 5.087537091988131e-06, + "loss": 0.9692, + "step": 66720 + }, + { + "epoch": 9.86, + "eval_loss": 0.8982540965080261, + "eval_runtime": 522.3791, + "eval_samples_per_second": 14.623, + "eval_wer": 0.32636724892078106, + "step": 66720 + }, + { + "epoch": 9.87, + "learning_rate": 5.084569732937686e-06, + "loss": 0.9479, + "step": 66760 + }, + { + "epoch": 9.87, + "eval_loss": 0.912302553653717, + "eval_runtime": 520.7727, + "eval_samples_per_second": 14.669, + "eval_wer": 0.32736784928099716, + "step": 66760 + }, + { + "epoch": 9.87, + "learning_rate": 5.081602373887241e-06, + "loss": 0.9893, + "step": 66800 + }, + { + "epoch": 9.87, + "eval_loss": 0.8948932886123657, + "eval_runtime": 521.5706, + "eval_samples_per_second": 14.646, + "eval_wer": 0.3265673689928243, + "step": 66800 + }, + { + "epoch": 9.88, + "learning_rate": 5.078635014836796e-06, + "loss": 1.1502, + "step": 66840 + }, + { + "epoch": 9.88, + "eval_loss": 0.9114333987236023, + "eval_runtime": 520.38, + "eval_samples_per_second": 14.68, + "eval_wer": 0.3275107921895995, + "step": 66840 + }, + { + "epoch": 9.89, + "learning_rate": 5.07566765578635e-06, + "loss": 1.0671, + "step": 66880 + }, + { + "epoch": 9.89, + "eval_loss": 0.9288748502731323, + "eval_runtime": 524.4667, + "eval_samples_per_second": 14.565, + "eval_wer": 0.3284542153863747, + "step": 66880 + }, + { + "epoch": 9.89, + "learning_rate": 5.072700296735905e-06, + "loss": 1.0816, + "step": 66920 + }, + { + "epoch": 9.89, + "eval_loss": 0.8821796178817749, + "eval_runtime": 521.7504, + "eval_samples_per_second": 14.641, + "eval_wer": 0.32556676863260814, + "step": 66920 + }, + { + "epoch": 9.9, + "learning_rate": 5.06973293768546e-06, + "loss": 1.0234, + "step": 66960 + }, + { + "epoch": 9.9, + "eval_loss": 0.8622782230377197, + "eval_runtime": 520.9596, + "eval_samples_per_second": 14.663, + "eval_wer": 0.32402298521970324, + "step": 66960 + }, + { + "epoch": 9.9, + "learning_rate": 5.066765578635015e-06, + "loss": 0.9492, + "step": 67000 + }, + { + "epoch": 9.9, + "eval_loss": 0.8956637382507324, + "eval_runtime": 520.7376, + "eval_samples_per_second": 14.67, + "eval_wer": 0.3260241859401355, + "step": 67000 + }, + { + "epoch": 9.91, + "learning_rate": 5.063798219584571e-06, + "loss": 0.9558, + "step": 67040 + }, + { + "epoch": 9.91, + "eval_loss": 0.8826231956481934, + "eval_runtime": 522.2875, + "eval_samples_per_second": 14.626, + "eval_wer": 0.3251665284885217, + "step": 67040 + }, + { + "epoch": 9.92, + "learning_rate": 5.060830860534125e-06, + "loss": 1.0034, + "step": 67080 + }, + { + "epoch": 9.92, + "eval_loss": 0.8922444581985474, + "eval_runtime": 519.7193, + "eval_samples_per_second": 14.698, + "eval_wer": 0.32642442608422195, + "step": 67080 + }, + { + "epoch": 9.92, + "learning_rate": 5.0578635014836795e-06, + "loss": 1.0837, + "step": 67120 + }, + { + "epoch": 9.92, + "eval_loss": 0.8789015412330627, + "eval_runtime": 523.7211, + "eval_samples_per_second": 14.586, + "eval_wer": 0.3255381800508877, + "step": 67120 + }, + { + "epoch": 9.93, + "learning_rate": 5.054896142433235e-06, + "loss": 0.9558, + "step": 67160 + }, + { + "epoch": 9.93, + "eval_loss": 0.9017727375030518, + "eval_runtime": 519.627, + "eval_samples_per_second": 14.701, + "eval_wer": 0.32665313473798563, + "step": 67160 + }, + { + "epoch": 9.93, + "learning_rate": 5.05192878338279e-06, + "loss": 1.036, + "step": 67200 + }, + { + "epoch": 9.93, + "eval_loss": 0.8582212924957275, + "eval_runtime": 520.8384, + "eval_samples_per_second": 14.667, + "eval_wer": 0.32336544784013266, + "step": 67200 + }, + { + "epoch": 9.94, + "learning_rate": 5.0489614243323445e-06, + "loss": 0.9534, + "step": 67240 + }, + { + "epoch": 9.94, + "eval_loss": 0.9113368391990662, + "eval_runtime": 522.2359, + "eval_samples_per_second": 14.627, + "eval_wer": 0.327482203607879, + "step": 67240 + }, + { + "epoch": 9.95, + "learning_rate": 5.0459940652819e-06, + "loss": 1.0424, + "step": 67280 + }, + { + "epoch": 9.95, + "eval_loss": 0.851280152797699, + "eval_runtime": 522.9704, + "eval_samples_per_second": 14.607, + "eval_wer": 0.3225363789702393, + "step": 67280 + }, + { + "epoch": 9.95, + "learning_rate": 5.043026706231454e-06, + "loss": 1.0009, + "step": 67320 + }, + { + "epoch": 9.95, + "eval_loss": 0.8853794932365417, + "eval_runtime": 520.4759, + "eval_samples_per_second": 14.677, + "eval_wer": 0.326052774521856, + "step": 67320 + }, + { + "epoch": 9.96, + "learning_rate": 5.040059347181009e-06, + "loss": 0.9924, + "step": 67360 + }, + { + "epoch": 9.96, + "eval_loss": 0.912270188331604, + "eval_runtime": 520.4995, + "eval_samples_per_second": 14.676, + "eval_wer": 0.32759655793476083, + "step": 67360 + }, + { + "epoch": 9.96, + "learning_rate": 5.037091988130565e-06, + "loss": 1.0416, + "step": 67400 + }, + { + "epoch": 9.96, + "eval_loss": 0.8639053702354431, + "eval_runtime": 520.2965, + "eval_samples_per_second": 14.682, + "eval_wer": 0.3243374596186283, + "step": 67400 + }, + { + "epoch": 9.97, + "learning_rate": 5.034124629080119e-06, + "loss": 0.9758, + "step": 67440 + }, + { + "epoch": 9.97, + "eval_loss": 0.8846729397773743, + "eval_runtime": 521.4295, + "eval_samples_per_second": 14.65, + "eval_wer": 0.32608136310357644, + "step": 67440 + }, + { + "epoch": 9.97, + "learning_rate": 5.031157270029674e-06, + "loss": 0.9483, + "step": 67480 + }, + { + "epoch": 9.97, + "eval_loss": 0.8801016807556152, + "eval_runtime": 521.2861, + "eval_samples_per_second": 14.654, + "eval_wer": 0.3261099516852969, + "step": 67480 + }, + { + "epoch": 9.98, + "learning_rate": 5.028189910979229e-06, + "loss": 1.0733, + "step": 67520 + }, + { + "epoch": 9.98, + "eval_loss": 0.8609018325805664, + "eval_runtime": 531.9105, + "eval_samples_per_second": 14.361, + "eval_wer": 0.32445181394551015, + "step": 67520 + }, + { + "epoch": 9.99, + "learning_rate": 5.025222551928783e-06, + "loss": 0.9401, + "step": 67560 + }, + { + "epoch": 9.99, + "eval_loss": 0.8885067701339722, + "eval_runtime": 521.1465, + "eval_samples_per_second": 14.658, + "eval_wer": 0.3268246662283084, + "step": 67560 + }, + { + "epoch": 9.99, + "learning_rate": 5.0222551928783396e-06, + "loss": 0.9864, + "step": 67600 + }, + { + "epoch": 9.99, + "eval_loss": 0.8686002492904663, + "eval_runtime": 521.183, + "eval_samples_per_second": 14.657, + "eval_wer": 0.3255095914691672, + "step": 67600 + }, + { + "epoch": 10.0, + "learning_rate": 5.019287833827894e-06, + "loss": 0.9447, + "step": 67640 + }, + { + "epoch": 10.0, + "eval_loss": 0.867267370223999, + "eval_runtime": 522.519, + "eval_samples_per_second": 14.62, + "eval_wer": 0.32505217416163984, + "step": 67640 + }, + { + "epoch": 10.0, + "learning_rate": 5.0163204747774484e-06, + "loss": 1.0504, + "step": 67680 + }, + { + "epoch": 10.0, + "eval_loss": 0.8603226542472839, + "eval_runtime": 523.8832, + "eval_samples_per_second": 14.581, + "eval_wer": 0.32482346550787616, + "step": 67680 + }, + { + "epoch": 10.01, + "learning_rate": 5.013353115727003e-06, + "loss": 0.9393, + "step": 67720 + }, + { + "epoch": 10.01, + "eval_loss": 0.887373149394989, + "eval_runtime": 521.6212, + "eval_samples_per_second": 14.645, + "eval_wer": 0.3269676091369107, + "step": 67720 + }, + { + "epoch": 10.02, + "learning_rate": 5.010385756676558e-06, + "loss": 0.9343, + "step": 67760 + }, + { + "epoch": 10.02, + "eval_loss": 0.915393054485321, + "eval_runtime": 520.0607, + "eval_samples_per_second": 14.689, + "eval_wer": 0.328597158294977, + "step": 67760 + }, + { + "epoch": 10.02, + "learning_rate": 5.0074183976261135e-06, + "loss": 0.9681, + "step": 67800 + }, + { + "epoch": 10.02, + "eval_loss": 0.8972141146659851, + "eval_runtime": 519.7733, + "eval_samples_per_second": 14.697, + "eval_wer": 0.3277395008433632, + "step": 67800 + }, + { + "epoch": 10.03, + "learning_rate": 5.004451038575669e-06, + "loss": 0.9328, + "step": 67840 + }, + { + "epoch": 10.03, + "eval_loss": 0.9027385115623474, + "eval_runtime": 518.8021, + "eval_samples_per_second": 14.724, + "eval_wer": 0.3279967980788473, + "step": 67840 + }, + { + "epoch": 10.03, + "learning_rate": 5.001483679525223e-06, + "loss": 0.9443, + "step": 67880 + }, + { + "epoch": 10.03, + "eval_loss": 0.8928678035736084, + "eval_runtime": 519.6746, + "eval_samples_per_second": 14.7, + "eval_wer": 0.3265673689928243, + "step": 67880 + }, + { + "epoch": 10.04, + "learning_rate": 4.998516320474778e-06, + "loss": 0.8907, + "step": 67920 + }, + { + "epoch": 10.04, + "eval_loss": 0.9327033758163452, + "eval_runtime": 519.136, + "eval_samples_per_second": 14.715, + "eval_wer": 0.3288830441121816, + "step": 67920 + }, + { + "epoch": 10.05, + "learning_rate": 4.995548961424333e-06, + "loss": 1.05, + "step": 67960 + }, + { + "epoch": 10.05, + "eval_loss": 0.8715218901634216, + "eval_runtime": 519.7165, + "eval_samples_per_second": 14.698, + "eval_wer": 0.3245089911089511, + "step": 67960 + }, + { + "epoch": 10.05, + "learning_rate": 4.992581602373887e-06, + "loss": 0.9604, + "step": 68000 + }, + { + "epoch": 10.05, + "eval_loss": 0.8848233819007874, + "eval_runtime": 519.6201, + "eval_samples_per_second": 14.701, + "eval_wer": 0.3257097115412104, + "step": 68000 + }, + { + "epoch": 10.06, + "learning_rate": 4.989614243323443e-06, + "loss": 0.9819, + "step": 68040 + }, + { + "epoch": 10.06, + "eval_loss": 0.9014686346054077, + "eval_runtime": 520.6224, + "eval_samples_per_second": 14.673, + "eval_wer": 0.3264816032476629, + "step": 68040 + }, + { + "epoch": 10.06, + "learning_rate": 4.986646884272998e-06, + "loss": 1.0349, + "step": 68080 + }, + { + "epoch": 10.06, + "eval_loss": 0.8478845953941345, + "eval_runtime": 519.3592, + "eval_samples_per_second": 14.709, + "eval_wer": 0.3227364990422825, + "step": 68080 + }, + { + "epoch": 10.07, + "learning_rate": 4.983679525222552e-06, + "loss": 1.0287, + "step": 68120 + }, + { + "epoch": 10.07, + "eval_loss": 0.8555676341056824, + "eval_runtime": 520.2487, + "eval_samples_per_second": 14.683, + "eval_wer": 0.3242802824551874, + "step": 68120 + }, + { + "epoch": 10.08, + "learning_rate": 4.980712166172107e-06, + "loss": 0.9722, + "step": 68160 + }, + { + "epoch": 10.08, + "eval_loss": 0.8866252899169922, + "eval_runtime": 519.5172, + "eval_samples_per_second": 14.704, + "eval_wer": 0.3269676091369107, + "step": 68160 + }, + { + "epoch": 10.08, + "learning_rate": 4.977744807121662e-06, + "loss": 1.0095, + "step": 68200 + }, + { + "epoch": 10.08, + "eval_loss": 0.8848801255226135, + "eval_runtime": 519.2243, + "eval_samples_per_second": 14.712, + "eval_wer": 0.3263958375025015, + "step": 68200 + }, + { + "epoch": 10.09, + "learning_rate": 4.9747774480712166e-06, + "loss": 0.9708, + "step": 68240 + }, + { + "epoch": 10.09, + "eval_loss": 0.8520979881286621, + "eval_runtime": 519.4554, + "eval_samples_per_second": 14.706, + "eval_wer": 0.32382286514766, + "step": 68240 + }, + { + "epoch": 10.09, + "learning_rate": 4.971810089020772e-06, + "loss": 0.9008, + "step": 68280 + }, + { + "epoch": 10.09, + "eval_loss": 0.8952348828315735, + "eval_runtime": 520.9594, + "eval_samples_per_second": 14.663, + "eval_wer": 0.32693902055519025, + "step": 68280 + }, + { + "epoch": 10.1, + "learning_rate": 4.968842729970327e-06, + "loss": 0.9823, + "step": 68320 + }, + { + "epoch": 10.1, + "eval_loss": 0.8546443581581116, + "eval_runtime": 520.3416, + "eval_samples_per_second": 14.681, + "eval_wer": 0.3233940364218531, + "step": 68320 + }, + { + "epoch": 10.1, + "learning_rate": 4.9658753709198816e-06, + "loss": 1.0789, + "step": 68360 + }, + { + "epoch": 10.1, + "eval_loss": 0.9444647431373596, + "eval_runtime": 520.9569, + "eval_samples_per_second": 14.663, + "eval_wer": 0.3298836444723977, + "step": 68360 + }, + { + "epoch": 10.11, + "learning_rate": 4.962908011869437e-06, + "loss": 0.9451, + "step": 68400 + }, + { + "epoch": 10.11, + "eval_loss": 0.8898735642433167, + "eval_runtime": 519.8119, + "eval_samples_per_second": 14.696, + "eval_wer": 0.3265387804111038, + "step": 68400 + }, + { + "epoch": 10.12, + "learning_rate": 4.959940652818991e-06, + "loss": 0.9306, + "step": 68440 + }, + { + "epoch": 10.12, + "eval_loss": 0.9030724167823792, + "eval_runtime": 519.9474, + "eval_samples_per_second": 14.692, + "eval_wer": 0.327853855170245, + "step": 68440 + }, + { + "epoch": 10.12, + "learning_rate": 4.956973293768547e-06, + "loss": 0.9497, + "step": 68480 + }, + { + "epoch": 10.12, + "eval_loss": 0.8822644352912903, + "eval_runtime": 518.9053, + "eval_samples_per_second": 14.721, + "eval_wer": 0.3257097115412104, + "step": 68480 + }, + { + "epoch": 10.13, + "learning_rate": 4.954005934718101e-06, + "loss": 0.9681, + "step": 68520 + }, + { + "epoch": 10.13, + "eval_loss": 0.8775320053100586, + "eval_runtime": 519.0025, + "eval_samples_per_second": 14.719, + "eval_wer": 0.32513793990680123, + "step": 68520 + }, + { + "epoch": 10.13, + "learning_rate": 4.951038575667656e-06, + "loss": 0.9448, + "step": 68560 + }, + { + "epoch": 10.13, + "eval_loss": 0.8945602774620056, + "eval_runtime": 520.1941, + "eval_samples_per_second": 14.685, + "eval_wer": 0.3261099516852969, + "step": 68560 + }, + { + "epoch": 10.14, + "learning_rate": 4.948071216617212e-06, + "loss": 0.9475, + "step": 68600 + }, + { + "epoch": 10.14, + "eval_loss": 0.893030047416687, + "eval_runtime": 519.5841, + "eval_samples_per_second": 14.702, + "eval_wer": 0.32585265444981276, + "step": 68600 + }, + { + "epoch": 10.15, + "learning_rate": 4.945103857566766e-06, + "loss": 0.9846, + "step": 68640 + }, + { + "epoch": 10.15, + "eval_loss": 0.8857608437538147, + "eval_runtime": 520.1839, + "eval_samples_per_second": 14.685, + "eval_wer": 0.32565253437776953, + "step": 68640 + }, + { + "epoch": 10.15, + "learning_rate": 4.9421364985163205e-06, + "loss": 0.9528, + "step": 68680 + }, + { + "epoch": 10.15, + "eval_loss": 0.8953890204429626, + "eval_runtime": 519.008, + "eval_samples_per_second": 14.718, + "eval_wer": 0.3255953572143286, + "step": 68680 + }, + { + "epoch": 10.16, + "learning_rate": 4.939169139465876e-06, + "loss": 0.9439, + "step": 68720 + }, + { + "epoch": 10.16, + "eval_loss": 0.9016136527061462, + "eval_runtime": 520.5151, + "eval_samples_per_second": 14.676, + "eval_wer": 0.3259670087766946, + "step": 68720 + }, + { + "epoch": 10.16, + "learning_rate": 4.93620178041543e-06, + "loss": 0.9644, + "step": 68760 + }, + { + "epoch": 10.16, + "eval_loss": 0.9108134508132935, + "eval_runtime": 520.8842, + "eval_samples_per_second": 14.665, + "eval_wer": 0.32708196346379254, + "step": 68760 + }, + { + "epoch": 10.17, + "learning_rate": 4.9332344213649855e-06, + "loss": 0.9902, + "step": 68800 + }, + { + "epoch": 10.17, + "eval_loss": 0.884946882724762, + "eval_runtime": 520.6698, + "eval_samples_per_second": 14.671, + "eval_wer": 0.32525229423368307, + "step": 68800 + }, + { + "epoch": 10.18, + "learning_rate": 4.930267062314541e-06, + "loss": 0.9801, + "step": 68840 + }, + { + "epoch": 10.18, + "eval_loss": 0.8763694763183594, + "eval_runtime": 520.5775, + "eval_samples_per_second": 14.674, + "eval_wer": 0.3241373395465851, + "step": 68840 + }, + { + "epoch": 10.18, + "learning_rate": 4.927299703264095e-06, + "loss": 0.9829, + "step": 68880 + }, + { + "epoch": 10.18, + "eval_loss": 0.8888580799102783, + "eval_runtime": 521.3114, + "eval_samples_per_second": 14.653, + "eval_wer": 0.32548100288744675, + "step": 68880 + }, + { + "epoch": 10.19, + "learning_rate": 4.9243323442136505e-06, + "loss": 0.941, + "step": 68920 + }, + { + "epoch": 10.19, + "eval_loss": 0.8793805837631226, + "eval_runtime": 521.0236, + "eval_samples_per_second": 14.662, + "eval_wer": 0.3250235855799194, + "step": 68920 + }, + { + "epoch": 10.19, + "learning_rate": 4.921364985163205e-06, + "loss": 0.8921, + "step": 68960 + }, + { + "epoch": 10.19, + "eval_loss": 0.8705631494522095, + "eval_runtime": 519.8345, + "eval_samples_per_second": 14.695, + "eval_wer": 0.32482346550787616, + "step": 68960 + }, + { + "epoch": 10.2, + "learning_rate": 4.91839762611276e-06, + "loss": 1.0995, + "step": 69000 + }, + { + "epoch": 10.2, + "eval_loss": 0.8404164910316467, + "eval_runtime": 520.925, + "eval_samples_per_second": 14.664, + "eval_wer": 0.322021784499271, + "step": 69000 + }, + { + "epoch": 10.21, + "learning_rate": 4.915430267062315e-06, + "loss": 1.0096, + "step": 69040 + }, + { + "epoch": 10.21, + "eval_loss": 0.8529436588287354, + "eval_runtime": 519.9045, + "eval_samples_per_second": 14.693, + "eval_wer": 0.32299379627776664, + "step": 69040 + }, + { + "epoch": 10.21, + "learning_rate": 4.91246290801187e-06, + "loss": 0.8961, + "step": 69080 + }, + { + "epoch": 10.21, + "eval_loss": 0.9113124012947083, + "eval_runtime": 520.8261, + "eval_samples_per_second": 14.667, + "eval_wer": 0.32759655793476083, + "step": 69080 + }, + { + "epoch": 10.22, + "learning_rate": 4.909495548961425e-06, + "loss": 1.0192, + "step": 69120 + }, + { + "epoch": 10.22, + "eval_loss": 0.8700169324874878, + "eval_runtime": 524.9671, + "eval_samples_per_second": 14.551, + "eval_wer": 0.32445181394551015, + "step": 69120 + }, + { + "epoch": 10.22, + "learning_rate": 4.90652818991098e-06, + "loss": 0.9803, + "step": 69160 + }, + { + "epoch": 10.22, + "eval_loss": 0.8752796053886414, + "eval_runtime": 519.7739, + "eval_samples_per_second": 14.697, + "eval_wer": 0.324566168272392, + "step": 69160 + }, + { + "epoch": 10.23, + "learning_rate": 4.903560830860534e-06, + "loss": 0.9103, + "step": 69200 + }, + { + "epoch": 10.23, + "eval_loss": 0.865210771560669, + "eval_runtime": 520.7878, + "eval_samples_per_second": 14.668, + "eval_wer": 0.32396580805626235, + "step": 69200 + }, + { + "epoch": 10.24, + "learning_rate": 4.9005934718100895e-06, + "loss": 0.9767, + "step": 69240 + }, + { + "epoch": 10.24, + "eval_loss": 0.8533618450164795, + "eval_runtime": 520.9914, + "eval_samples_per_second": 14.662, + "eval_wer": 0.32265073329712113, + "step": 69240 + }, + { + "epoch": 10.24, + "learning_rate": 4.897626112759644e-06, + "loss": 0.9659, + "step": 69280 + }, + { + "epoch": 10.24, + "eval_loss": 0.8541852831840515, + "eval_runtime": 522.2259, + "eval_samples_per_second": 14.628, + "eval_wer": 0.3226793218788416, + "step": 69280 + }, + { + "epoch": 10.25, + "learning_rate": 4.894658753709199e-06, + "loss": 0.9956, + "step": 69320 + }, + { + "epoch": 10.25, + "eval_loss": 0.863059937953949, + "eval_runtime": 520.858, + "eval_samples_per_second": 14.666, + "eval_wer": 0.32276508762400297, + "step": 69320 + }, + { + "epoch": 10.25, + "learning_rate": 4.8916913946587545e-06, + "loss": 1.0389, + "step": 69360 + }, + { + "epoch": 10.25, + "eval_loss": 0.8505798578262329, + "eval_runtime": 525.5601, + "eval_samples_per_second": 14.535, + "eval_wer": 0.32213613882615283, + "step": 69360 + }, + { + "epoch": 10.26, + "learning_rate": 4.888724035608309e-06, + "loss": 0.9305, + "step": 69400 + }, + { + "epoch": 10.26, + "eval_loss": 0.8797439932823181, + "eval_runtime": 521.1722, + "eval_samples_per_second": 14.657, + "eval_wer": 0.3236227450756168, + "step": 69400 + }, + { + "epoch": 10.26, + "learning_rate": 4.885756676557864e-06, + "loss": 1.0258, + "step": 69440 + }, + { + "epoch": 10.26, + "eval_loss": 0.8905665874481201, + "eval_runtime": 521.8144, + "eval_samples_per_second": 14.639, + "eval_wer": 0.32430887103690786, + "step": 69440 + }, + { + "epoch": 10.27, + "learning_rate": 4.882789317507419e-06, + "loss": 0.9568, + "step": 69480 + }, + { + "epoch": 10.27, + "eval_loss": 0.8786068558692932, + "eval_runtime": 521.627, + "eval_samples_per_second": 14.645, + "eval_wer": 0.323136739186369, + "step": 69480 + }, + { + "epoch": 10.28, + "learning_rate": 4.879821958456974e-06, + "loss": 1.099, + "step": 69520 + }, + { + "epoch": 10.28, + "eval_loss": 0.9136019349098206, + "eval_runtime": 523.0948, + "eval_samples_per_second": 14.603, + "eval_wer": 0.326738900483147, + "step": 69520 + }, + { + "epoch": 10.28, + "learning_rate": 4.876854599406528e-06, + "loss": 0.9568, + "step": 69560 + }, + { + "epoch": 10.28, + "eval_loss": 0.8350768685340881, + "eval_runtime": 521.2349, + "eval_samples_per_second": 14.656, + "eval_wer": 0.3211927156293776, + "step": 69560 + }, + { + "epoch": 10.29, + "learning_rate": 4.873887240356084e-06, + "loss": 0.9558, + "step": 69600 + }, + { + "epoch": 10.29, + "eval_loss": 0.8770838975906372, + "eval_runtime": 520.3594, + "eval_samples_per_second": 14.68, + "eval_wer": 0.32388004231110096, + "step": 69600 + }, + { + "epoch": 10.29, + "learning_rate": 4.870919881305638e-06, + "loss": 0.9485, + "step": 69640 + }, + { + "epoch": 10.29, + "eval_loss": 0.9053707122802734, + "eval_runtime": 520.6726, + "eval_samples_per_second": 14.671, + "eval_wer": 0.3259670087766946, + "step": 69640 + }, + { + "epoch": 10.3, + "learning_rate": 4.867952522255193e-06, + "loss": 0.9942, + "step": 69680 + }, + { + "epoch": 10.3, + "eval_loss": 0.8666454553604126, + "eval_runtime": 520.8291, + "eval_samples_per_second": 14.667, + "eval_wer": 0.32256496755195974, + "step": 69680 + }, + { + "epoch": 10.31, + "learning_rate": 4.864985163204748e-06, + "loss": 0.95, + "step": 69720 + }, + { + "epoch": 10.31, + "eval_loss": 0.8948246836662292, + "eval_runtime": 520.0228, + "eval_samples_per_second": 14.69, + "eval_wer": 0.32462334543583293, + "step": 69720 + }, + { + "epoch": 10.31, + "learning_rate": 4.862017804154303e-06, + "loss": 0.962, + "step": 69760 + }, + { + "epoch": 10.31, + "eval_loss": 0.9286537170410156, + "eval_runtime": 520.3667, + "eval_samples_per_second": 14.68, + "eval_wer": 0.3277395008433632, + "step": 69760 + }, + { + "epoch": 10.32, + "learning_rate": 4.859050445103858e-06, + "loss": 0.9754, + "step": 69800 + }, + { + "epoch": 10.32, + "eval_loss": 0.9044238328933716, + "eval_runtime": 520.4914, + "eval_samples_per_second": 14.677, + "eval_wer": 0.32548100288744675, + "step": 69800 + }, + { + "epoch": 10.32, + "learning_rate": 4.856083086053413e-06, + "loss": 1.0, + "step": 69840 + }, + { + "epoch": 10.32, + "eval_loss": 0.8822633624076843, + "eval_runtime": 520.5102, + "eval_samples_per_second": 14.676, + "eval_wer": 0.3238514537293805, + "step": 69840 + }, + { + "epoch": 10.33, + "learning_rate": 4.853115727002968e-06, + "loss": 1.0474, + "step": 69880 + }, + { + "epoch": 10.33, + "eval_loss": 0.8866599798202515, + "eval_runtime": 520.1319, + "eval_samples_per_second": 14.687, + "eval_wer": 0.3237085108207782, + "step": 69880 + }, + { + "epoch": 10.34, + "learning_rate": 4.850148367952523e-06, + "loss": 1.0089, + "step": 69920 + }, + { + "epoch": 10.34, + "eval_loss": 0.8930904865264893, + "eval_runtime": 520.2657, + "eval_samples_per_second": 14.683, + "eval_wer": 0.3236513336573373, + "step": 69920 + }, + { + "epoch": 10.34, + "learning_rate": 4.847181008902078e-06, + "loss": 0.9994, + "step": 69960 + }, + { + "epoch": 10.34, + "eval_loss": 0.866547167301178, + "eval_runtime": 519.6931, + "eval_samples_per_second": 14.699, + "eval_wer": 0.3227364990422825, + "step": 69960 + }, + { + "epoch": 10.35, + "learning_rate": 4.844213649851632e-06, + "loss": 0.927, + "step": 70000 + }, + { + "epoch": 10.35, + "eval_loss": 0.9207704663276672, + "eval_runtime": 520.4449, + "eval_samples_per_second": 14.678, + "eval_wer": 0.32590983161325365, + "step": 70000 + }, + { + "epoch": 10.35, + "learning_rate": 4.841246290801188e-06, + "loss": 0.9742, + "step": 70040 + }, + { + "epoch": 10.35, + "eval_loss": 0.9033421874046326, + "eval_runtime": 521.1649, + "eval_samples_per_second": 14.658, + "eval_wer": 0.32448040252723065, + "step": 70040 + }, + { + "epoch": 10.36, + "learning_rate": 4.838278931750742e-06, + "loss": 0.951, + "step": 70080 + }, + { + "epoch": 10.36, + "eval_loss": 0.8707385063171387, + "eval_runtime": 521.7732, + "eval_samples_per_second": 14.64, + "eval_wer": 0.32250779038851884, + "step": 70080 + }, + { + "epoch": 10.37, + "learning_rate": 4.835311572700297e-06, + "loss": 0.9406, + "step": 70120 + }, + { + "epoch": 10.37, + "eval_loss": 0.9025798439979553, + "eval_runtime": 520.6072, + "eval_samples_per_second": 14.673, + "eval_wer": 0.32473769976271477, + "step": 70120 + }, + { + "epoch": 10.37, + "learning_rate": 4.832344213649852e-06, + "loss": 0.9382, + "step": 70160 + }, + { + "epoch": 10.37, + "eval_loss": 0.9063680768013, + "eval_runtime": 519.6691, + "eval_samples_per_second": 14.7, + "eval_wer": 0.3252808828154035, + "step": 70160 + }, + { + "epoch": 10.38, + "learning_rate": 4.829376854599407e-06, + "loss": 0.9484, + "step": 70200 + }, + { + "epoch": 10.38, + "eval_loss": 0.8975633978843689, + "eval_runtime": 520.3955, + "eval_samples_per_second": 14.679, + "eval_wer": 0.32505217416163984, + "step": 70200 + }, + { + "epoch": 10.38, + "learning_rate": 4.8264094955489615e-06, + "loss": 0.9278, + "step": 70240 + }, + { + "epoch": 10.38, + "eval_loss": 0.9052666425704956, + "eval_runtime": 520.2799, + "eval_samples_per_second": 14.682, + "eval_wer": 0.3248520540895966, + "step": 70240 + }, + { + "epoch": 10.39, + "learning_rate": 4.823442136498517e-06, + "loss": 0.9595, + "step": 70280 + }, + { + "epoch": 10.39, + "eval_loss": 0.9478540420532227, + "eval_runtime": 521.4602, + "eval_samples_per_second": 14.649, + "eval_wer": 0.32753938077131994, + "step": 70280 + }, + { + "epoch": 10.39, + "learning_rate": 4.820474777448071e-06, + "loss": 0.8641, + "step": 70320 + }, + { + "epoch": 10.39, + "eval_loss": 0.9234895706176758, + "eval_runtime": 519.9417, + "eval_samples_per_second": 14.692, + "eval_wer": 0.32642442608422195, + "step": 70320 + }, + { + "epoch": 10.4, + "learning_rate": 4.8175074183976265e-06, + "loss": 0.9098, + "step": 70360 + }, + { + "epoch": 10.4, + "eval_loss": 0.8805803060531616, + "eval_runtime": 520.6164, + "eval_samples_per_second": 14.673, + "eval_wer": 0.3236227450756168, + "step": 70360 + }, + { + "epoch": 10.41, + "learning_rate": 4.814540059347181e-06, + "loss": 1.0238, + "step": 70400 + }, + { + "epoch": 10.41, + "eval_loss": 0.8794459700584412, + "eval_runtime": 520.5516, + "eval_samples_per_second": 14.675, + "eval_wer": 0.32327968209497127, + "step": 70400 + }, + { + "epoch": 10.41, + "learning_rate": 4.811572700296736e-06, + "loss": 0.9531, + "step": 70440 + }, + { + "epoch": 10.41, + "eval_loss": 0.8738023042678833, + "eval_runtime": 520.9524, + "eval_samples_per_second": 14.664, + "eval_wer": 0.3226793218788416, + "step": 70440 + }, + { + "epoch": 10.42, + "learning_rate": 4.8086053412462916e-06, + "loss": 0.9162, + "step": 70480 + }, + { + "epoch": 10.42, + "eval_loss": 0.9220749139785767, + "eval_runtime": 519.7937, + "eval_samples_per_second": 14.696, + "eval_wer": 0.3257097115412104, + "step": 70480 + }, + { + "epoch": 10.42, + "learning_rate": 4.805637982195846e-06, + "loss": 0.9298, + "step": 70520 + }, + { + "epoch": 10.42, + "eval_loss": 0.9116944670677185, + "eval_runtime": 520.3225, + "eval_samples_per_second": 14.681, + "eval_wer": 0.3252237056519626, + "step": 70520 + }, + { + "epoch": 10.43, + "learning_rate": 4.802670623145401e-06, + "loss": 0.9405, + "step": 70560 + }, + { + "epoch": 10.43, + "eval_loss": 0.9383991360664368, + "eval_runtime": 521.1487, + "eval_samples_per_second": 14.658, + "eval_wer": 0.3272249063723949, + "step": 70560 + }, + { + "epoch": 10.44, + "learning_rate": 4.799703264094956e-06, + "loss": 0.9481, + "step": 70600 + }, + { + "epoch": 10.44, + "eval_loss": 0.8848059177398682, + "eval_runtime": 522.3537, + "eval_samples_per_second": 14.624, + "eval_wer": 0.3236513336573373, + "step": 70600 + }, + { + "epoch": 10.44, + "learning_rate": 4.79673590504451e-06, + "loss": 1.0222, + "step": 70640 + }, + { + "epoch": 10.44, + "eval_loss": 0.8753991723060608, + "eval_runtime": 522.5012, + "eval_samples_per_second": 14.62, + "eval_wer": 0.32307956202292804, + "step": 70640 + }, + { + "epoch": 10.45, + "learning_rate": 4.7937685459940655e-06, + "loss": 0.9078, + "step": 70680 + }, + { + "epoch": 10.45, + "eval_loss": 0.8681339025497437, + "eval_runtime": 520.8065, + "eval_samples_per_second": 14.668, + "eval_wer": 0.32205037308099144, + "step": 70680 + }, + { + "epoch": 10.45, + "learning_rate": 4.790801186943621e-06, + "loss": 0.9506, + "step": 70720 + }, + { + "epoch": 10.45, + "eval_loss": 0.9011270999908447, + "eval_runtime": 521.7086, + "eval_samples_per_second": 14.642, + "eval_wer": 0.32410875096486463, + "step": 70720 + }, + { + "epoch": 10.46, + "learning_rate": 4.787833827893175e-06, + "loss": 0.9749, + "step": 70760 + }, + { + "epoch": 10.46, + "eval_loss": 0.8979442715644836, + "eval_runtime": 520.5289, + "eval_samples_per_second": 14.675, + "eval_wer": 0.3231653277680894, + "step": 70760 + }, + { + "epoch": 10.47, + "learning_rate": 4.7848664688427305e-06, + "loss": 0.9435, + "step": 70800 + }, + { + "epoch": 10.47, + "eval_loss": 0.8887069225311279, + "eval_runtime": 520.4877, + "eval_samples_per_second": 14.677, + "eval_wer": 0.32293661911432575, + "step": 70800 + }, + { + "epoch": 10.47, + "learning_rate": 4.781899109792285e-06, + "loss": 0.9725, + "step": 70840 + }, + { + "epoch": 10.47, + "eval_loss": 0.8892274498939514, + "eval_runtime": 521.6681, + "eval_samples_per_second": 14.643, + "eval_wer": 0.3227079104605621, + "step": 70840 + }, + { + "epoch": 10.48, + "learning_rate": 4.77893175074184e-06, + "loss": 1.0846, + "step": 70880 + }, + { + "epoch": 10.48, + "eval_loss": 0.8860262632369995, + "eval_runtime": 520.6359, + "eval_samples_per_second": 14.672, + "eval_wer": 0.3228794419508848, + "step": 70880 + }, + { + "epoch": 10.48, + "learning_rate": 4.775964391691395e-06, + "loss": 0.9715, + "step": 70920 + }, + { + "epoch": 10.48, + "eval_loss": 0.9077578783035278, + "eval_runtime": 524.7673, + "eval_samples_per_second": 14.557, + "eval_wer": 0.32453757969067154, + "step": 70920 + }, + { + "epoch": 10.49, + "learning_rate": 4.77299703264095e-06, + "loss": 0.9252, + "step": 70960 + }, + { + "epoch": 10.49, + "eval_loss": 0.9092930555343628, + "eval_runtime": 520.8007, + "eval_samples_per_second": 14.668, + "eval_wer": 0.3250807627433603, + "step": 70960 + }, + { + "epoch": 10.5, + "learning_rate": 4.770029673590505e-06, + "loss": 1.0072, + "step": 71000 + }, + { + "epoch": 10.5, + "eval_loss": 0.8523333668708801, + "eval_runtime": 521.1417, + "eval_samples_per_second": 14.658, + "eval_wer": 0.32102118413905484, + "step": 71000 + }, + { + "epoch": 10.5, + "learning_rate": 4.76706231454006e-06, + "loss": 0.9764, + "step": 71040 + }, + { + "epoch": 10.5, + "eval_loss": 0.848875105381012, + "eval_runtime": 521.2791, + "eval_samples_per_second": 14.654, + "eval_wer": 0.3209925955573344, + "step": 71040 + }, + { + "epoch": 10.51, + "learning_rate": 4.764094955489615e-06, + "loss": 0.9327, + "step": 71080 + }, + { + "epoch": 10.51, + "eval_loss": 0.9033676385879517, + "eval_runtime": 520.8488, + "eval_samples_per_second": 14.666, + "eval_wer": 0.32393721947454185, + "step": 71080 + }, + { + "epoch": 10.51, + "learning_rate": 4.761127596439169e-06, + "loss": 0.9715, + "step": 71120 + }, + { + "epoch": 10.51, + "eval_loss": 0.896257758140564, + "eval_runtime": 520.1501, + "eval_samples_per_second": 14.686, + "eval_wer": 0.3237370994024986, + "step": 71120 + }, + { + "epoch": 10.52, + "learning_rate": 4.758160237388724e-06, + "loss": 0.9763, + "step": 71160 + }, + { + "epoch": 10.52, + "eval_loss": 0.8802129626274109, + "eval_runtime": 520.8581, + "eval_samples_per_second": 14.666, + "eval_wer": 0.3226793218788416, + "step": 71160 + }, + { + "epoch": 10.52, + "learning_rate": 4.755192878338279e-06, + "loss": 0.9363, + "step": 71200 + }, + { + "epoch": 10.52, + "eval_loss": 0.8886792063713074, + "eval_runtime": 520.1716, + "eval_samples_per_second": 14.686, + "eval_wer": 0.32388004231110096, + "step": 71200 + }, + { + "epoch": 10.53, + "learning_rate": 4.7522255192878344e-06, + "loss": 0.9738, + "step": 71240 + }, + { + "epoch": 10.53, + "eval_loss": 0.8836033940315247, + "eval_runtime": 519.8805, + "eval_samples_per_second": 14.694, + "eval_wer": 0.3232510935132508, + "step": 71240 + }, + { + "epoch": 10.54, + "learning_rate": 4.749258160237389e-06, + "loss": 1.0652, + "step": 71280 + }, + { + "epoch": 10.54, + "eval_loss": 0.8500810861587524, + "eval_runtime": 521.86, + "eval_samples_per_second": 14.638, + "eval_wer": 0.32113553846593673, + "step": 71280 + }, + { + "epoch": 10.54, + "learning_rate": 4.746290801186944e-06, + "loss": 0.9597, + "step": 71320 + }, + { + "epoch": 10.54, + "eval_loss": 0.8457416296005249, + "eval_runtime": 521.4444, + "eval_samples_per_second": 14.65, + "eval_wer": 0.3207638869035707, + "step": 71320 + }, + { + "epoch": 10.55, + "learning_rate": 4.743323442136499e-06, + "loss": 1.0061, + "step": 71360 + }, + { + "epoch": 10.55, + "eval_loss": 0.8846386075019836, + "eval_runtime": 523.329, + "eval_samples_per_second": 14.597, + "eval_wer": 0.3232510935132508, + "step": 71360 + }, + { + "epoch": 10.55, + "learning_rate": 4.740356083086054e-06, + "loss": 0.9374, + "step": 71400 + }, + { + "epoch": 10.55, + "eval_loss": 0.872814416885376, + "eval_runtime": 520.0926, + "eval_samples_per_second": 14.688, + "eval_wer": 0.32290803053260525, + "step": 71400 + }, + { + "epoch": 10.56, + "learning_rate": 4.737388724035608e-06, + "loss": 0.9333, + "step": 71440 + }, + { + "epoch": 10.56, + "eval_loss": 0.9094192385673523, + "eval_runtime": 521.9504, + "eval_samples_per_second": 14.635, + "eval_wer": 0.3253666485605649, + "step": 71440 + }, + { + "epoch": 10.57, + "learning_rate": 4.734421364985164e-06, + "loss": 1.038, + "step": 71480 + }, + { + "epoch": 10.57, + "eval_loss": 0.900380551815033, + "eval_runtime": 522.765, + "eval_samples_per_second": 14.613, + "eval_wer": 0.3245089911089511, + "step": 71480 + }, + { + "epoch": 10.57, + "learning_rate": 4.731454005934719e-06, + "loss": 0.9222, + "step": 71520 + }, + { + "epoch": 10.57, + "eval_loss": 0.9000558257102966, + "eval_runtime": 521.5483, + "eval_samples_per_second": 14.647, + "eval_wer": 0.324566168272392, + "step": 71520 + }, + { + "epoch": 10.58, + "learning_rate": 4.728486646884273e-06, + "loss": 0.9437, + "step": 71560 + }, + { + "epoch": 10.58, + "eval_loss": 0.8690860271453857, + "eval_runtime": 520.67, + "eval_samples_per_second": 14.671, + "eval_wer": 0.3217930758455073, + "step": 71560 + }, + { + "epoch": 10.58, + "learning_rate": 4.725519287833829e-06, + "loss": 0.8783, + "step": 71600 + }, + { + "epoch": 10.58, + "eval_loss": 0.8936105966567993, + "eval_runtime": 521.6934, + "eval_samples_per_second": 14.643, + "eval_wer": 0.3234798021670145, + "step": 71600 + }, + { + "epoch": 10.59, + "learning_rate": 4.722551928783383e-06, + "loss": 0.9335, + "step": 71640 + }, + { + "epoch": 10.59, + "eval_loss": 0.8966529965400696, + "eval_runtime": 521.561, + "eval_samples_per_second": 14.646, + "eval_wer": 0.3237370994024986, + "step": 71640 + }, + { + "epoch": 10.6, + "learning_rate": 4.7195845697329375e-06, + "loss": 0.9271, + "step": 71680 + }, + { + "epoch": 10.6, + "eval_loss": 0.8892812728881836, + "eval_runtime": 522.0638, + "eval_samples_per_second": 14.632, + "eval_wer": 0.3231653277680894, + "step": 71680 + }, + { + "epoch": 10.6, + "learning_rate": 4.716617210682493e-06, + "loss": 0.9601, + "step": 71720 + }, + { + "epoch": 10.6, + "eval_loss": 0.8958648443222046, + "eval_runtime": 520.2594, + "eval_samples_per_second": 14.683, + "eval_wer": 0.32393721947454185, + "step": 71720 + }, + { + "epoch": 10.61, + "learning_rate": 4.713649851632048e-06, + "loss": 0.9677, + "step": 71760 + }, + { + "epoch": 10.61, + "eval_loss": 0.8912705779075623, + "eval_runtime": 520.2253, + "eval_samples_per_second": 14.684, + "eval_wer": 0.32382286514766, + "step": 71760 + }, + { + "epoch": 10.61, + "learning_rate": 4.7106824925816025e-06, + "loss": 0.9804, + "step": 71800 + }, + { + "epoch": 10.61, + "eval_loss": 0.871073842048645, + "eval_runtime": 520.979, + "eval_samples_per_second": 14.663, + "eval_wer": 0.3227364990422825, + "step": 71800 + }, + { + "epoch": 10.62, + "learning_rate": 4.707715133531158e-06, + "loss": 0.9544, + "step": 71840 + }, + { + "epoch": 10.62, + "eval_loss": 0.8795429468154907, + "eval_runtime": 520.7409, + "eval_samples_per_second": 14.669, + "eval_wer": 0.32302238485948714, + "step": 71840 + }, + { + "epoch": 10.63, + "learning_rate": 4.704747774480712e-06, + "loss": 0.9949, + "step": 71880 + }, + { + "epoch": 10.63, + "eval_loss": 0.8602790236473083, + "eval_runtime": 519.9555, + "eval_samples_per_second": 14.692, + "eval_wer": 0.32156436719174364, + "step": 71880 + }, + { + "epoch": 10.63, + "learning_rate": 4.7017804154302676e-06, + "loss": 0.9017, + "step": 71920 + }, + { + "epoch": 10.63, + "eval_loss": 0.8819182515144348, + "eval_runtime": 521.7396, + "eval_samples_per_second": 14.641, + "eval_wer": 0.3232225049315304, + "step": 71920 + }, + { + "epoch": 10.64, + "learning_rate": 4.698813056379822e-06, + "loss": 0.9789, + "step": 71960 + }, + { + "epoch": 10.64, + "eval_loss": 0.9399983882904053, + "eval_runtime": 522.8319, + "eval_samples_per_second": 14.611, + "eval_wer": 0.32676748906486747, + "step": 71960 + }, + { + "epoch": 10.64, + "learning_rate": 4.695845697329377e-06, + "loss": 0.9463, + "step": 72000 + }, + { + "epoch": 10.64, + "eval_loss": 0.9292511940002441, + "eval_runtime": 520.183, + "eval_samples_per_second": 14.685, + "eval_wer": 0.32599559735841505, + "step": 72000 + }, + { + "epoch": 10.65, + "learning_rate": 4.692878338278933e-06, + "loss": 0.967, + "step": 72040 + }, + { + "epoch": 10.65, + "eval_loss": 0.9241394996643066, + "eval_runtime": 520.7614, + "eval_samples_per_second": 14.669, + "eval_wer": 0.3260241859401355, + "step": 72040 + }, + { + "epoch": 10.65, + "learning_rate": 4.689910979228487e-06, + "loss": 0.9133, + "step": 72080 + }, + { + "epoch": 10.65, + "eval_loss": 0.903540313243866, + "eval_runtime": 520.7816, + "eval_samples_per_second": 14.668, + "eval_wer": 0.32396580805626235, + "step": 72080 + }, + { + "epoch": 10.66, + "learning_rate": 4.686943620178042e-06, + "loss": 0.9418, + "step": 72120 + }, + { + "epoch": 10.66, + "eval_loss": 0.8934593200683594, + "eval_runtime": 521.3581, + "eval_samples_per_second": 14.652, + "eval_wer": 0.3228222647874439, + "step": 72120 + }, + { + "epoch": 10.67, + "learning_rate": 4.683976261127597e-06, + "loss": 0.944, + "step": 72160 + }, + { + "epoch": 10.67, + "eval_loss": 0.8802918791770935, + "eval_runtime": 521.8829, + "eval_samples_per_second": 14.637, + "eval_wer": 0.3224506132250779, + "step": 72160 + }, + { + "epoch": 10.67, + "learning_rate": 4.681008902077151e-06, + "loss": 0.9282, + "step": 72200 + }, + { + "epoch": 10.67, + "eval_loss": 0.9022666215896606, + "eval_runtime": 521.2972, + "eval_samples_per_second": 14.654, + "eval_wer": 0.32448040252723065, + "step": 72200 + }, + { + "epoch": 10.68, + "learning_rate": 4.6780415430267065e-06, + "loss": 0.9503, + "step": 72240 + }, + { + "epoch": 10.68, + "eval_loss": 0.8996410965919495, + "eval_runtime": 521.2157, + "eval_samples_per_second": 14.656, + "eval_wer": 0.3243374596186283, + "step": 72240 + }, + { + "epoch": 10.68, + "learning_rate": 4.675074183976262e-06, + "loss": 0.9949, + "step": 72280 + }, + { + "epoch": 10.68, + "eval_loss": 0.8651266694068909, + "eval_runtime": 520.787, + "eval_samples_per_second": 14.668, + "eval_wer": 0.32190743017238915, + "step": 72280 + }, + { + "epoch": 10.69, + "learning_rate": 4.672106824925816e-06, + "loss": 0.935, + "step": 72320 + }, + { + "epoch": 10.69, + "eval_loss": 0.8835282921791077, + "eval_runtime": 521.5136, + "eval_samples_per_second": 14.648, + "eval_wer": 0.32350839074873494, + "step": 72320 + }, + { + "epoch": 10.7, + "learning_rate": 4.6691394658753715e-06, + "loss": 1.0497, + "step": 72360 + }, + { + "epoch": 10.7, + "eval_loss": 0.8520467281341553, + "eval_runtime": 520.6793, + "eval_samples_per_second": 14.671, + "eval_wer": 0.32156436719174364, + "step": 72360 + }, + { + "epoch": 10.7, + "learning_rate": 4.666172106824926e-06, + "loss": 0.9092, + "step": 72400 + }, + { + "epoch": 10.7, + "eval_loss": 0.904299795627594, + "eval_runtime": 522.8287, + "eval_samples_per_second": 14.611, + "eval_wer": 0.3254524143057263, + "step": 72400 + }, + { + "epoch": 10.71, + "learning_rate": 4.663204747774481e-06, + "loss": 0.9463, + "step": 72440 + }, + { + "epoch": 10.71, + "eval_loss": 0.9232798218727112, + "eval_runtime": 525.5561, + "eval_samples_per_second": 14.535, + "eval_wer": 0.3262243060121787, + "step": 72440 + }, + { + "epoch": 10.71, + "learning_rate": 4.660237388724036e-06, + "loss": 0.9709, + "step": 72480 + }, + { + "epoch": 10.71, + "eval_loss": 0.8644095659255981, + "eval_runtime": 524.7166, + "eval_samples_per_second": 14.558, + "eval_wer": 0.3215929557734641, + "step": 72480 + }, + { + "epoch": 10.72, + "learning_rate": 4.657270029673591e-06, + "loss": 1.0441, + "step": 72520 + }, + { + "epoch": 10.72, + "eval_loss": 0.8986897468566895, + "eval_runtime": 523.9298, + "eval_samples_per_second": 14.58, + "eval_wer": 0.3241373395465851, + "step": 72520 + }, + { + "epoch": 10.73, + "learning_rate": 4.654302670623146e-06, + "loss": 0.9398, + "step": 72560 + }, + { + "epoch": 10.73, + "eval_loss": 0.8832688331604004, + "eval_runtime": 524.3016, + "eval_samples_per_second": 14.57, + "eval_wer": 0.3227936762057234, + "step": 72560 + }, + { + "epoch": 10.73, + "learning_rate": 4.651335311572701e-06, + "loss": 0.9733, + "step": 72600 + }, + { + "epoch": 10.73, + "eval_loss": 0.8743331432342529, + "eval_runtime": 524.7035, + "eval_samples_per_second": 14.559, + "eval_wer": 0.3221933159895938, + "step": 72600 + }, + { + "epoch": 10.74, + "learning_rate": 4.648367952522256e-06, + "loss": 0.9333, + "step": 72640 + }, + { + "epoch": 10.74, + "eval_loss": 0.9266566038131714, + "eval_runtime": 524.2784, + "eval_samples_per_second": 14.571, + "eval_wer": 0.3264530146659424, + "step": 72640 + }, + { + "epoch": 10.74, + "learning_rate": 4.6454005934718104e-06, + "loss": 0.9602, + "step": 72680 + }, + { + "epoch": 10.74, + "eval_loss": 0.8927357792854309, + "eval_runtime": 525.4728, + "eval_samples_per_second": 14.537, + "eval_wer": 0.32302238485948714, + "step": 72680 + }, + { + "epoch": 10.75, + "learning_rate": 4.642433234421365e-06, + "loss": 0.9851, + "step": 72720 + }, + { + "epoch": 10.75, + "eval_loss": 0.89580237865448, + "eval_runtime": 527.4459, + "eval_samples_per_second": 14.483, + "eval_wer": 0.324194516710026, + "step": 72720 + }, + { + "epoch": 10.76, + "learning_rate": 4.63946587537092e-06, + "loss": 1.031, + "step": 72760 + }, + { + "epoch": 10.76, + "eval_loss": 0.8396863341331482, + "eval_runtime": 523.4582, + "eval_samples_per_second": 14.593, + "eval_wer": 0.31984905228851596, + "step": 72760 + }, + { + "epoch": 10.76, + "learning_rate": 4.6364985163204755e-06, + "loss": 0.9311, + "step": 72800 + }, + { + "epoch": 10.76, + "eval_loss": 0.8570407629013062, + "eval_runtime": 523.7823, + "eval_samples_per_second": 14.584, + "eval_wer": 0.3213356585379799, + "step": 72800 + }, + { + "epoch": 10.77, + "learning_rate": 4.63353115727003e-06, + "loss": 0.9378, + "step": 72840 + }, + { + "epoch": 10.77, + "eval_loss": 0.8933374881744385, + "eval_runtime": 525.3467, + "eval_samples_per_second": 14.541, + "eval_wer": 0.32290803053260525, + "step": 72840 + }, + { + "epoch": 10.77, + "learning_rate": 4.630563798219585e-06, + "loss": 0.9257, + "step": 72880 + }, + { + "epoch": 10.77, + "eval_loss": 0.9002131819725037, + "eval_runtime": 525.7906, + "eval_samples_per_second": 14.529, + "eval_wer": 0.3236227450756168, + "step": 72880 + }, + { + "epoch": 10.78, + "learning_rate": 4.62759643916914e-06, + "loss": 0.9722, + "step": 72920 + }, + { + "epoch": 10.78, + "eval_loss": 0.8562790155410767, + "eval_runtime": 524.8892, + "eval_samples_per_second": 14.554, + "eval_wer": 0.32059235541324793, + "step": 72920 + }, + { + "epoch": 10.78, + "learning_rate": 4.624629080118695e-06, + "loss": 0.9408, + "step": 72960 + }, + { + "epoch": 10.78, + "eval_loss": 0.9242084622383118, + "eval_runtime": 525.0422, + "eval_samples_per_second": 14.549, + "eval_wer": 0.32585265444981276, + "step": 72960 + }, + { + "epoch": 10.79, + "learning_rate": 4.621661721068249e-06, + "loss": 0.9703, + "step": 73000 + }, + { + "epoch": 10.79, + "eval_loss": 0.8803754448890686, + "eval_runtime": 524.4827, + "eval_samples_per_second": 14.565, + "eval_wer": 0.3214500128648618, + "step": 73000 + }, + { + "epoch": 10.8, + "learning_rate": 4.618694362017805e-06, + "loss": 0.9967, + "step": 73040 + }, + { + "epoch": 10.8, + "eval_loss": 0.8814731240272522, + "eval_runtime": 524.8111, + "eval_samples_per_second": 14.556, + "eval_wer": 0.32182166442722776, + "step": 73040 + }, + { + "epoch": 10.8, + "learning_rate": 4.61572700296736e-06, + "loss": 0.9714, + "step": 73080 + }, + { + "epoch": 10.8, + "eval_loss": 0.8946047425270081, + "eval_runtime": 523.7473, + "eval_samples_per_second": 14.585, + "eval_wer": 0.3229652076960462, + "step": 73080 + }, + { + "epoch": 10.81, + "learning_rate": 4.612759643916914e-06, + "loss": 0.9677, + "step": 73120 + }, + { + "epoch": 10.81, + "eval_loss": 0.9137767553329468, + "eval_runtime": 525.7317, + "eval_samples_per_second": 14.53, + "eval_wer": 0.32462334543583293, + "step": 73120 + }, + { + "epoch": 10.81, + "learning_rate": 4.60979228486647e-06, + "loss": 1.0144, + "step": 73160 + }, + { + "epoch": 10.81, + "eval_loss": 0.8741853833198547, + "eval_runtime": 524.9133, + "eval_samples_per_second": 14.553, + "eval_wer": 0.32233625889819606, + "step": 73160 + }, + { + "epoch": 10.82, + "learning_rate": 4.606824925816024e-06, + "loss": 0.9708, + "step": 73200 + }, + { + "epoch": 10.82, + "eval_loss": 0.8897590041160583, + "eval_runtime": 524.0338, + "eval_samples_per_second": 14.577, + "eval_wer": 0.3228794419508848, + "step": 73200 + }, + { + "epoch": 10.83, + "learning_rate": 4.6038575667655786e-06, + "loss": 0.9205, + "step": 73240 + }, + { + "epoch": 10.83, + "eval_loss": 0.8928082585334778, + "eval_runtime": 523.4708, + "eval_samples_per_second": 14.593, + "eval_wer": 0.3231939163498099, + "step": 73240 + }, + { + "epoch": 10.83, + "learning_rate": 4.600890207715134e-06, + "loss": 0.9227, + "step": 73280 + }, + { + "epoch": 10.83, + "eval_loss": 0.9004506468772888, + "eval_runtime": 524.3864, + "eval_samples_per_second": 14.568, + "eval_wer": 0.3238514537293805, + "step": 73280 + }, + { + "epoch": 10.84, + "learning_rate": 4.597922848664689e-06, + "loss": 0.9565, + "step": 73320 + }, + { + "epoch": 10.84, + "eval_loss": 0.8970906138420105, + "eval_runtime": 528.9581, + "eval_samples_per_second": 14.442, + "eval_wer": 0.32353697933045544, + "step": 73320 + }, + { + "epoch": 10.84, + "learning_rate": 4.5949554896142436e-06, + "loss": 0.9446, + "step": 73360 + }, + { + "epoch": 10.84, + "eval_loss": 0.9179455637931824, + "eval_runtime": 523.4575, + "eval_samples_per_second": 14.593, + "eval_wer": 0.3251665284885217, + "step": 73360 + }, + { + "epoch": 10.85, + "learning_rate": 4.591988130563799e-06, + "loss": 0.9818, + "step": 73400 + }, + { + "epoch": 10.85, + "eval_loss": 0.8927173614501953, + "eval_runtime": 524.8299, + "eval_samples_per_second": 14.555, + "eval_wer": 0.3227079104605621, + "step": 73400 + }, + { + "epoch": 10.86, + "learning_rate": 4.589020771513353e-06, + "loss": 0.9459, + "step": 73440 + }, + { + "epoch": 10.86, + "eval_loss": 0.9190839529037476, + "eval_runtime": 524.2324, + "eval_samples_per_second": 14.572, + "eval_wer": 0.32490923125303756, + "step": 73440 + }, + { + "epoch": 10.86, + "learning_rate": 4.586053412462909e-06, + "loss": 0.9711, + "step": 73480 + }, + { + "epoch": 10.86, + "eval_loss": 0.8907099962234497, + "eval_runtime": 524.3043, + "eval_samples_per_second": 14.57, + "eval_wer": 0.3231081506046485, + "step": 73480 + }, + { + "epoch": 10.87, + "learning_rate": 4.583086053412463e-06, + "loss": 0.9907, + "step": 73520 + }, + { + "epoch": 10.87, + "eval_loss": 0.8781489729881287, + "eval_runtime": 525.6235, + "eval_samples_per_second": 14.533, + "eval_wer": 0.3209354183938935, + "step": 73520 + }, + { + "epoch": 10.87, + "learning_rate": 4.580118694362018e-06, + "loss": 0.9833, + "step": 73560 + }, + { + "epoch": 10.87, + "eval_loss": 0.880021333694458, + "eval_runtime": 529.3724, + "eval_samples_per_second": 14.43, + "eval_wer": 0.3215071900283027, + "step": 73560 + }, + { + "epoch": 10.88, + "learning_rate": 4.577151335311573e-06, + "loss": 0.941, + "step": 73600 + }, + { + "epoch": 10.88, + "eval_loss": 0.8843143582344055, + "eval_runtime": 524.277, + "eval_samples_per_second": 14.571, + "eval_wer": 0.3222219045713142, + "step": 73600 + }, + { + "epoch": 10.89, + "learning_rate": 4.574183976261128e-06, + "loss": 0.9319, + "step": 73640 + }, + { + "epoch": 10.89, + "eval_loss": 0.8761234283447266, + "eval_runtime": 523.6765, + "eval_samples_per_second": 14.587, + "eval_wer": 0.3218502530089482, + "step": 73640 + }, + { + "epoch": 10.89, + "learning_rate": 4.571216617210683e-06, + "loss": 0.9896, + "step": 73680 + }, + { + "epoch": 10.89, + "eval_loss": 0.9129985570907593, + "eval_runtime": 526.1525, + "eval_samples_per_second": 14.519, + "eval_wer": 0.3239086308928214, + "step": 73680 + }, + { + "epoch": 10.9, + "learning_rate": 4.568249258160238e-06, + "loss": 0.9725, + "step": 73720 + }, + { + "epoch": 10.9, + "eval_loss": 0.8738813996315002, + "eval_runtime": 525.487, + "eval_samples_per_second": 14.537, + "eval_wer": 0.32182166442722776, + "step": 73720 + }, + { + "epoch": 10.9, + "learning_rate": 4.565281899109792e-06, + "loss": 1.1795, + "step": 73760 + }, + { + "epoch": 10.9, + "eval_loss": 0.8719978928565979, + "eval_runtime": 524.0472, + "eval_samples_per_second": 14.577, + "eval_wer": 0.321650132936905, + "step": 73760 + }, + { + "epoch": 10.91, + "learning_rate": 4.5623145400593475e-06, + "loss": 0.9403, + "step": 73800 + }, + { + "epoch": 10.91, + "eval_loss": 0.8749380111694336, + "eval_runtime": 525.6468, + "eval_samples_per_second": 14.533, + "eval_wer": 0.3213642471197004, + "step": 73800 + }, + { + "epoch": 10.91, + "learning_rate": 4.559347181008903e-06, + "loss": 0.9482, + "step": 73840 + }, + { + "epoch": 10.91, + "eval_loss": 0.878515899181366, + "eval_runtime": 528.7275, + "eval_samples_per_second": 14.448, + "eval_wer": 0.3211927156293776, + "step": 73840 + }, + { + "epoch": 10.92, + "learning_rate": 4.556379821958457e-06, + "loss": 0.9609, + "step": 73880 + }, + { + "epoch": 10.92, + "eval_loss": 0.891594648361206, + "eval_runtime": 526.2485, + "eval_samples_per_second": 14.516, + "eval_wer": 0.3227364990422825, + "step": 73880 + }, + { + "epoch": 10.93, + "learning_rate": 4.5534124629080125e-06, + "loss": 0.9562, + "step": 73920 + }, + { + "epoch": 10.93, + "eval_loss": 0.8731803894042969, + "eval_runtime": 525.2919, + "eval_samples_per_second": 14.542, + "eval_wer": 0.32096400697561395, + "step": 73920 + }, + { + "epoch": 10.93, + "learning_rate": 4.550445103857567e-06, + "loss": 0.9035, + "step": 73960 + }, + { + "epoch": 10.93, + "eval_loss": 0.8698758482933044, + "eval_runtime": 526.1817, + "eval_samples_per_second": 14.518, + "eval_wer": 0.3207638869035707, + "step": 73960 + }, + { + "epoch": 10.94, + "learning_rate": 4.547477744807122e-06, + "loss": 1.0354, + "step": 74000 + }, + { + "epoch": 10.94, + "eval_loss": 0.8353917598724365, + "eval_runtime": 525.614, + "eval_samples_per_second": 14.533, + "eval_wer": 0.31864833185625663, + "step": 74000 + }, + { + "epoch": 10.94, + "learning_rate": 4.544510385756677e-06, + "loss": 0.9191, + "step": 74040 + }, + { + "epoch": 10.94, + "eval_loss": 0.8867946863174438, + "eval_runtime": 525.4632, + "eval_samples_per_second": 14.538, + "eval_wer": 0.32250779038851884, + "step": 74040 + }, + { + "epoch": 10.95, + "learning_rate": 4.541543026706232e-06, + "loss": 0.995, + "step": 74080 + }, + { + "epoch": 10.95, + "eval_loss": 0.8792908191680908, + "eval_runtime": 523.8417, + "eval_samples_per_second": 14.583, + "eval_wer": 0.32176448726378687, + "step": 74080 + }, + { + "epoch": 10.96, + "learning_rate": 4.5385756676557864e-06, + "loss": 0.9945, + "step": 74120 + }, + { + "epoch": 10.96, + "eval_loss": 0.8628720641136169, + "eval_runtime": 526.036, + "eval_samples_per_second": 14.522, + "eval_wer": 0.3208496526487321, + "step": 74120 + }, + { + "epoch": 10.96, + "learning_rate": 4.535608308605342e-06, + "loss": 1.0121, + "step": 74160 + }, + { + "epoch": 10.96, + "eval_loss": 0.892354428768158, + "eval_runtime": 526.2185, + "eval_samples_per_second": 14.517, + "eval_wer": 0.32290803053260525, + "step": 74160 + }, + { + "epoch": 10.97, + "learning_rate": 4.532640949554897e-06, + "loss": 0.9101, + "step": 74200 + }, + { + "epoch": 10.97, + "eval_loss": 0.906641960144043, + "eval_runtime": 525.4095, + "eval_samples_per_second": 14.539, + "eval_wer": 0.32453757969067154, + "step": 74200 + }, + { + "epoch": 10.97, + "learning_rate": 4.5296735905044515e-06, + "loss": 1.0146, + "step": 74240 + }, + { + "epoch": 10.97, + "eval_loss": 0.8744897842407227, + "eval_runtime": 526.3374, + "eval_samples_per_second": 14.514, + "eval_wer": 0.32173589868206637, + "step": 74240 + }, + { + "epoch": 10.98, + "learning_rate": 4.526706231454006e-06, + "loss": 0.9507, + "step": 74280 + }, + { + "epoch": 10.98, + "eval_loss": 0.8952358961105347, + "eval_runtime": 525.5129, + "eval_samples_per_second": 14.536, + "eval_wer": 0.32393721947454185, + "step": 74280 + }, + { + "epoch": 10.99, + "learning_rate": 4.523738872403561e-06, + "loss": 1.0102, + "step": 74320 + }, + { + "epoch": 10.99, + "eval_loss": 0.8603987097740173, + "eval_runtime": 525.281, + "eval_samples_per_second": 14.543, + "eval_wer": 0.32110694988421623, + "step": 74320 + }, + { + "epoch": 10.99, + "learning_rate": 4.520771513353116e-06, + "loss": 0.8952, + "step": 74360 + }, + { + "epoch": 10.99, + "eval_loss": 0.8740472197532654, + "eval_runtime": 526.6935, + "eval_samples_per_second": 14.504, + "eval_wer": 0.3215071900283027, + "step": 74360 + }, + { + "epoch": 11.0, + "learning_rate": 4.517804154302671e-06, + "loss": 1.0285, + "step": 74400 + }, + { + "epoch": 11.0, + "eval_loss": 0.8457785248756409, + "eval_runtime": 526.1276, + "eval_samples_per_second": 14.519, + "eval_wer": 0.31976328654335456, + "step": 74400 + }, + { + "epoch": 11.0, + "learning_rate": 4.514836795252226e-06, + "loss": 0.9734, + "step": 74440 + }, + { + "epoch": 11.0, + "eval_loss": 0.8885073065757751, + "eval_runtime": 521.0012, + "eval_samples_per_second": 14.662, + "eval_wer": 0.32250779038851884, + "step": 74440 + }, + { + "epoch": 11.01, + "learning_rate": 4.511869436201781e-06, + "loss": 0.9128, + "step": 74480 + }, + { + "epoch": 11.01, + "eval_loss": 0.8826667666435242, + "eval_runtime": 523.726, + "eval_samples_per_second": 14.586, + "eval_wer": 0.3218788415906687, + "step": 74480 + }, + { + "epoch": 11.02, + "learning_rate": 4.508902077151336e-06, + "loss": 0.9021, + "step": 74520 + }, + { + "epoch": 11.02, + "eval_loss": 0.8978096842765808, + "eval_runtime": 523.2864, + "eval_samples_per_second": 14.598, + "eval_wer": 0.32336544784013266, + "step": 74520 + }, + { + "epoch": 11.02, + "learning_rate": 4.50593471810089e-06, + "loss": 0.9032, + "step": 74560 + }, + { + "epoch": 11.02, + "eval_loss": 0.8780806660652161, + "eval_runtime": 524.4218, + "eval_samples_per_second": 14.567, + "eval_wer": 0.3228222647874439, + "step": 74560 + }, + { + "epoch": 11.03, + "learning_rate": 4.502967359050445e-06, + "loss": 0.9704, + "step": 74600 + }, + { + "epoch": 11.03, + "eval_loss": 0.8668006062507629, + "eval_runtime": 524.323, + "eval_samples_per_second": 14.569, + "eval_wer": 0.32182166442722776, + "step": 74600 + }, + { + "epoch": 11.03, + "learning_rate": 4.5e-06, + "loss": 0.9952, + "step": 74640 + }, + { + "epoch": 11.03, + "eval_loss": 0.8721791505813599, + "eval_runtime": 523.6147, + "eval_samples_per_second": 14.589, + "eval_wer": 0.3224506132250779, + "step": 74640 + }, + { + "epoch": 11.04, + "learning_rate": 4.497032640949555e-06, + "loss": 0.9568, + "step": 74680 + }, + { + "epoch": 11.04, + "eval_loss": 0.8970568776130676, + "eval_runtime": 522.9607, + "eval_samples_per_second": 14.607, + "eval_wer": 0.32359415649389633, + "step": 74680 + }, + { + "epoch": 11.05, + "learning_rate": 4.494065281899111e-06, + "loss": 0.8775, + "step": 74720 + }, + { + "epoch": 11.05, + "eval_loss": 0.9438607692718506, + "eval_runtime": 523.5648, + "eval_samples_per_second": 14.59, + "eval_wer": 0.32862574687669743, + "step": 74720 + }, + { + "epoch": 11.05, + "learning_rate": 4.491097922848665e-06, + "loss": 0.9661, + "step": 74760 + }, + { + "epoch": 11.05, + "eval_loss": 0.9346503615379333, + "eval_runtime": 522.7263, + "eval_samples_per_second": 14.614, + "eval_wer": 0.32782526658852457, + "step": 74760 + }, + { + "epoch": 11.06, + "learning_rate": 4.4881305637982196e-06, + "loss": 0.9692, + "step": 74800 + }, + { + "epoch": 11.06, + "eval_loss": 0.8514189124107361, + "eval_runtime": 523.1053, + "eval_samples_per_second": 14.603, + "eval_wer": 0.3209925955573344, + "step": 74800 + }, + { + "epoch": 11.06, + "learning_rate": 4.485163204747775e-06, + "loss": 0.9424, + "step": 74840 + }, + { + "epoch": 11.06, + "eval_loss": 0.8838129043579102, + "eval_runtime": 525.5234, + "eval_samples_per_second": 14.536, + "eval_wer": 0.322393436061637, + "step": 74840 + }, + { + "epoch": 11.07, + "learning_rate": 4.482195845697329e-06, + "loss": 1.0194, + "step": 74880 + }, + { + "epoch": 11.07, + "eval_loss": 0.875468909740448, + "eval_runtime": 522.6881, + "eval_samples_per_second": 14.615, + "eval_wer": 0.32225049315303467, + "step": 74880 + }, + { + "epoch": 11.07, + "learning_rate": 4.479228486646885e-06, + "loss": 0.9779, + "step": 74920 + }, + { + "epoch": 11.07, + "eval_loss": 0.8767786622047424, + "eval_runtime": 524.5456, + "eval_samples_per_second": 14.563, + "eval_wer": 0.32130706995625946, + "step": 74920 + }, + { + "epoch": 11.08, + "learning_rate": 4.47626112759644e-06, + "loss": 0.9414, + "step": 74960 + }, + { + "epoch": 11.08, + "eval_loss": 0.8720973134040833, + "eval_runtime": 522.9051, + "eval_samples_per_second": 14.609, + "eval_wer": 0.32073529832185027, + "step": 74960 + }, + { + "epoch": 11.09, + "learning_rate": 4.473293768545994e-06, + "loss": 0.8873, + "step": 75000 + }, + { + "epoch": 11.09, + "eval_loss": 0.875963032245636, + "eval_runtime": 528.4531, + "eval_samples_per_second": 14.455, + "eval_wer": 0.3203350581777638, + "step": 75000 + }, + { + "epoch": 11.09, + "learning_rate": 4.47032640949555e-06, + "loss": 1.0264, + "step": 75040 + }, + { + "epoch": 11.09, + "eval_loss": 0.8486378788948059, + "eval_runtime": 524.5217, + "eval_samples_per_second": 14.564, + "eval_wer": 0.31993481803367735, + "step": 75040 + }, + { + "epoch": 11.1, + "learning_rate": 4.467359050445104e-06, + "loss": 0.9439, + "step": 75080 + }, + { + "epoch": 11.1, + "eval_loss": 0.8814006447792053, + "eval_runtime": 523.1588, + "eval_samples_per_second": 14.602, + "eval_wer": 0.32087824123045255, + "step": 75080 + }, + { + "epoch": 11.1, + "learning_rate": 4.4643916913946585e-06, + "loss": 0.9525, + "step": 75120 + }, + { + "epoch": 11.1, + "eval_loss": 0.8579049706459045, + "eval_runtime": 523.1109, + "eval_samples_per_second": 14.603, + "eval_wer": 0.3195345778895909, + "step": 75120 + }, + { + "epoch": 11.11, + "learning_rate": 4.461424332344214e-06, + "loss": 0.9222, + "step": 75160 + }, + { + "epoch": 11.11, + "eval_loss": 0.8688095211982727, + "eval_runtime": 522.0458, + "eval_samples_per_second": 14.633, + "eval_wer": 0.3200491723605592, + "step": 75160 + }, + { + "epoch": 11.12, + "learning_rate": 4.458456973293769e-06, + "loss": 1.0064, + "step": 75200 + }, + { + "epoch": 11.12, + "eval_loss": 0.8521592020988464, + "eval_runtime": 524.3019, + "eval_samples_per_second": 14.57, + "eval_wer": 0.3192201034906658, + "step": 75200 + }, + { + "epoch": 11.12, + "learning_rate": 4.455489614243324e-06, + "loss": 1.015, + "step": 75240 + }, + { + "epoch": 11.12, + "eval_loss": 0.8656142950057983, + "eval_runtime": 523.4487, + "eval_samples_per_second": 14.594, + "eval_wer": 0.3203350581777638, + "step": 75240 + }, + { + "epoch": 11.13, + "learning_rate": 4.452522255192879e-06, + "loss": 0.9538, + "step": 75280 + }, + { + "epoch": 11.13, + "eval_loss": 0.8780498504638672, + "eval_runtime": 523.4789, + "eval_samples_per_second": 14.593, + "eval_wer": 0.32073529832185027, + "step": 75280 + }, + { + "epoch": 11.13, + "learning_rate": 4.449554896142433e-06, + "loss": 0.9829, + "step": 75320 + }, + { + "epoch": 11.13, + "eval_loss": 0.8492316007614136, + "eval_runtime": 523.9296, + "eval_samples_per_second": 14.58, + "eval_wer": 0.31970610937991367, + "step": 75320 + }, + { + "epoch": 11.14, + "learning_rate": 4.4465875370919885e-06, + "loss": 0.9522, + "step": 75360 + }, + { + "epoch": 11.14, + "eval_loss": 0.8852068185806274, + "eval_runtime": 524.2386, + "eval_samples_per_second": 14.572, + "eval_wer": 0.32122130421109807, + "step": 75360 + }, + { + "epoch": 11.15, + "learning_rate": 4.443620178041543e-06, + "loss": 1.0412, + "step": 75400 + }, + { + "epoch": 11.15, + "eval_loss": 0.847435712814331, + "eval_runtime": 524.6081, + "eval_samples_per_second": 14.561, + "eval_wer": 0.31907716058206353, + "step": 75400 + }, + { + "epoch": 11.15, + "learning_rate": 4.440652818991098e-06, + "loss": 1.0201, + "step": 75440 + }, + { + "epoch": 11.15, + "eval_loss": 0.8226905465126038, + "eval_runtime": 523.5105, + "eval_samples_per_second": 14.592, + "eval_wer": 0.3180765602218474, + "step": 75440 + }, + { + "epoch": 11.16, + "learning_rate": 4.4376854599406536e-06, + "loss": 0.9351, + "step": 75480 + }, + { + "epoch": 11.16, + "eval_loss": 0.8551357388496399, + "eval_runtime": 521.7265, + "eval_samples_per_second": 14.642, + "eval_wer": 0.3190199834186226, + "step": 75480 + }, + { + "epoch": 11.16, + "learning_rate": 4.434718100890208e-06, + "loss": 0.9727, + "step": 75520 + }, + { + "epoch": 11.16, + "eval_loss": 0.8358757495880127, + "eval_runtime": 523.8655, + "eval_samples_per_second": 14.582, + "eval_wer": 0.31833385745733156, + "step": 75520 + }, + { + "epoch": 11.17, + "learning_rate": 4.431750741839763e-06, + "loss": 0.974, + "step": 75560 + }, + { + "epoch": 11.17, + "eval_loss": 0.8249419331550598, + "eval_runtime": 522.4274, + "eval_samples_per_second": 14.622, + "eval_wer": 0.3181623259670088, + "step": 75560 + }, + { + "epoch": 11.18, + "learning_rate": 4.428783382789318e-06, + "loss": 0.9907, + "step": 75600 + }, + { + "epoch": 11.18, + "eval_loss": 0.8717795610427856, + "eval_runtime": 523.6648, + "eval_samples_per_second": 14.588, + "eval_wer": 0.3203350581777638, + "step": 75600 + }, + { + "epoch": 11.18, + "learning_rate": 4.425816023738872e-06, + "loss": 0.8836, + "step": 75640 + }, + { + "epoch": 11.18, + "eval_loss": 0.8697574734687805, + "eval_runtime": 522.0614, + "eval_samples_per_second": 14.632, + "eval_wer": 0.32079247548529116, + "step": 75640 + }, + { + "epoch": 11.19, + "learning_rate": 4.4228486646884275e-06, + "loss": 1.1145, + "step": 75680 + }, + { + "epoch": 11.19, + "eval_loss": 0.8500919938087463, + "eval_runtime": 523.5363, + "eval_samples_per_second": 14.591, + "eval_wer": 0.319105749163784, + "step": 75680 + }, + { + "epoch": 11.19, + "learning_rate": 4.419881305637983e-06, + "loss": 0.9274, + "step": 75720 + }, + { + "epoch": 11.19, + "eval_loss": 0.8455411791801453, + "eval_runtime": 524.0247, + "eval_samples_per_second": 14.578, + "eval_wer": 0.31876268618313847, + "step": 75720 + }, + { + "epoch": 11.2, + "learning_rate": 4.416913946587538e-06, + "loss": 0.9664, + "step": 75760 + }, + { + "epoch": 11.2, + "eval_loss": 0.852229654788971, + "eval_runtime": 523.6824, + "eval_samples_per_second": 14.587, + "eval_wer": 0.3186769204379771, + "step": 75760 + }, + { + "epoch": 11.2, + "learning_rate": 4.4139465875370925e-06, + "loss": 0.989, + "step": 75800 + }, + { + "epoch": 11.2, + "eval_loss": 0.8532190322875977, + "eval_runtime": 524.3885, + "eval_samples_per_second": 14.567, + "eval_wer": 0.3189628062551817, + "step": 75800 + }, + { + "epoch": 11.21, + "learning_rate": 4.410979228486647e-06, + "loss": 1.0197, + "step": 75840 + }, + { + "epoch": 11.21, + "eval_loss": 0.8395006060600281, + "eval_runtime": 526.2888, + "eval_samples_per_second": 14.515, + "eval_wer": 0.31833385745733156, + "step": 75840 + }, + { + "epoch": 11.22, + "learning_rate": 4.408011869436202e-06, + "loss": 0.8914, + "step": 75880 + }, + { + "epoch": 11.22, + "eval_loss": 0.8726134300231934, + "eval_runtime": 525.165, + "eval_samples_per_second": 14.546, + "eval_wer": 0.3205637668315275, + "step": 75880 + }, + { + "epoch": 11.22, + "learning_rate": 4.405044510385757e-06, + "loss": 0.9613, + "step": 75920 + }, + { + "epoch": 11.22, + "eval_loss": 0.8647737503051758, + "eval_runtime": 522.6925, + "eval_samples_per_second": 14.615, + "eval_wer": 0.320906829812173, + "step": 75920 + }, + { + "epoch": 11.23, + "learning_rate": 4.402077151335312e-06, + "loss": 1.0091, + "step": 75960 + }, + { + "epoch": 11.23, + "eval_loss": 0.8674173355102539, + "eval_runtime": 525.0311, + "eval_samples_per_second": 14.55, + "eval_wer": 0.3206495325766889, + "step": 75960 + }, + { + "epoch": 11.23, + "learning_rate": 4.399109792284867e-06, + "loss": 0.9536, + "step": 76000 + }, + { + "epoch": 11.23, + "eval_loss": 0.8850842714309692, + "eval_runtime": 523.4306, + "eval_samples_per_second": 14.594, + "eval_wer": 0.32113553846593673, + "step": 76000 + }, + { + "epoch": 11.24, + "learning_rate": 4.396142433234422e-06, + "loss": 0.89, + "step": 76040 + }, + { + "epoch": 11.24, + "eval_loss": 0.891082227230072, + "eval_runtime": 524.0262, + "eval_samples_per_second": 14.578, + "eval_wer": 0.3215071900283027, + "step": 76040 + }, + { + "epoch": 11.25, + "learning_rate": 4.393175074183977e-06, + "loss": 1.0062, + "step": 76080 + }, + { + "epoch": 11.25, + "eval_loss": 0.8741889595985413, + "eval_runtime": 523.0906, + "eval_samples_per_second": 14.604, + "eval_wer": 0.3202492924326024, + "step": 76080 + }, + { + "epoch": 11.25, + "learning_rate": 4.390207715133531e-06, + "loss": 0.9512, + "step": 76120 + }, + { + "epoch": 11.25, + "eval_loss": 0.8631335496902466, + "eval_runtime": 523.0758, + "eval_samples_per_second": 14.604, + "eval_wer": 0.32007776094227963, + "step": 76120 + }, + { + "epoch": 11.26, + "learning_rate": 4.387240356083086e-06, + "loss": 0.9638, + "step": 76160 + }, + { + "epoch": 11.26, + "eval_loss": 0.8634206056594849, + "eval_runtime": 524.3463, + "eval_samples_per_second": 14.569, + "eval_wer": 0.32062094399496843, + "step": 76160 + }, + { + "epoch": 11.26, + "learning_rate": 4.384272997032641e-06, + "loss": 0.9005, + "step": 76200 + }, + { + "epoch": 11.26, + "eval_loss": 0.9086675643920898, + "eval_runtime": 528.5838, + "eval_samples_per_second": 14.452, + "eval_wer": 0.3240515738014237, + "step": 76200 + }, + { + "epoch": 11.27, + "learning_rate": 4.3813056379821964e-06, + "loss": 1.0394, + "step": 76240 + }, + { + "epoch": 11.27, + "eval_loss": 0.8832709193229675, + "eval_runtime": 523.2408, + "eval_samples_per_second": 14.599, + "eval_wer": 0.3218502530089482, + "step": 76240 + }, + { + "epoch": 11.28, + "learning_rate": 4.378338278931752e-06, + "loss": 0.968, + "step": 76280 + }, + { + "epoch": 11.28, + "eval_loss": 0.8536676168441772, + "eval_runtime": 525.0184, + "eval_samples_per_second": 14.55, + "eval_wer": 0.31993481803367735, + "step": 76280 + }, + { + "epoch": 11.28, + "learning_rate": 4.375370919881306e-06, + "loss": 0.8996, + "step": 76320 + }, + { + "epoch": 11.28, + "eval_loss": 0.8971124887466431, + "eval_runtime": 523.9537, + "eval_samples_per_second": 14.58, + "eval_wer": 0.3227364990422825, + "step": 76320 + }, + { + "epoch": 11.29, + "learning_rate": 4.372403560830861e-06, + "loss": 0.9724, + "step": 76360 + }, + { + "epoch": 11.29, + "eval_loss": 0.9403702020645142, + "eval_runtime": 524.5224, + "eval_samples_per_second": 14.564, + "eval_wer": 0.3276823236799222, + "step": 76360 + }, + { + "epoch": 11.29, + "learning_rate": 4.369436201780416e-06, + "loss": 0.9281, + "step": 76400 + }, + { + "epoch": 11.29, + "eval_loss": 0.8814358115196228, + "eval_runtime": 524.3808, + "eval_samples_per_second": 14.568, + "eval_wer": 0.32213613882615283, + "step": 76400 + }, + { + "epoch": 11.3, + "learning_rate": 4.36646884272997e-06, + "loss": 0.9009, + "step": 76440 + }, + { + "epoch": 11.3, + "eval_loss": 0.9166126847267151, + "eval_runtime": 522.9804, + "eval_samples_per_second": 14.607, + "eval_wer": 0.32585265444981276, + "step": 76440 + }, + { + "epoch": 11.31, + "learning_rate": 4.363501483679526e-06, + "loss": 0.9202, + "step": 76480 + }, + { + "epoch": 11.31, + "eval_loss": 0.895381510257721, + "eval_runtime": 527.5508, + "eval_samples_per_second": 14.48, + "eval_wer": 0.3239943966379828, + "step": 76480 + }, + { + "epoch": 11.31, + "learning_rate": 4.360534124629081e-06, + "loss": 0.8901, + "step": 76520 + }, + { + "epoch": 11.31, + "eval_loss": 0.8956805467605591, + "eval_runtime": 523.3535, + "eval_samples_per_second": 14.596, + "eval_wer": 0.32345121358529405, + "step": 76520 + }, + { + "epoch": 11.32, + "learning_rate": 4.357566765578635e-06, + "loss": 1.115, + "step": 76560 + }, + { + "epoch": 11.32, + "eval_loss": 0.8780887126922607, + "eval_runtime": 523.5987, + "eval_samples_per_second": 14.589, + "eval_wer": 0.32205037308099144, + "step": 76560 + }, + { + "epoch": 11.32, + "learning_rate": 4.354599406528191e-06, + "loss": 0.9533, + "step": 76600 + }, + { + "epoch": 11.32, + "eval_loss": 0.8578474521636963, + "eval_runtime": 525.2436, + "eval_samples_per_second": 14.544, + "eval_wer": 0.3200491723605592, + "step": 76600 + }, + { + "epoch": 11.33, + "learning_rate": 4.351632047477745e-06, + "loss": 1.0046, + "step": 76640 + }, + { + "epoch": 11.33, + "eval_loss": 0.8688116073608398, + "eval_runtime": 524.354, + "eval_samples_per_second": 14.568, + "eval_wer": 0.32102118413905484, + "step": 76640 + }, + { + "epoch": 11.33, + "learning_rate": 4.3486646884272995e-06, + "loss": 1.0077, + "step": 76680 + }, + { + "epoch": 11.33, + "eval_loss": 0.8444474339485168, + "eval_runtime": 523.2439, + "eval_samples_per_second": 14.599, + "eval_wer": 0.3194488121444295, + "step": 76680 + }, + { + "epoch": 11.34, + "learning_rate": 4.345697329376855e-06, + "loss": 0.9173, + "step": 76720 + }, + { + "epoch": 11.34, + "eval_loss": 0.8727929592132568, + "eval_runtime": 524.1524, + "eval_samples_per_second": 14.574, + "eval_wer": 0.32196460733583004, + "step": 76720 + }, + { + "epoch": 11.35, + "learning_rate": 4.34272997032641e-06, + "loss": 0.9061, + "step": 76760 + }, + { + "epoch": 11.35, + "eval_loss": 0.8930858373641968, + "eval_runtime": 526.0488, + "eval_samples_per_second": 14.521, + "eval_wer": 0.32342262500357355, + "step": 76760 + }, + { + "epoch": 11.35, + "learning_rate": 4.339762611275965e-06, + "loss": 0.955, + "step": 76800 + }, + { + "epoch": 11.35, + "eval_loss": 0.8974524736404419, + "eval_runtime": 524.545, + "eval_samples_per_second": 14.563, + "eval_wer": 0.32439463678206926, + "step": 76800 + }, + { + "epoch": 11.36, + "learning_rate": 4.33679525222552e-06, + "loss": 0.8996, + "step": 76840 + }, + { + "epoch": 11.36, + "eval_loss": 0.886813759803772, + "eval_runtime": 524.7226, + "eval_samples_per_second": 14.558, + "eval_wer": 0.32299379627776664, + "step": 76840 + }, + { + "epoch": 11.36, + "learning_rate": 4.333827893175074e-06, + "loss": 0.8936, + "step": 76880 + }, + { + "epoch": 11.36, + "eval_loss": 0.8785150051116943, + "eval_runtime": 523.9155, + "eval_samples_per_second": 14.581, + "eval_wer": 0.32182166442722776, + "step": 76880 + }, + { + "epoch": 11.37, + "learning_rate": 4.3308605341246296e-06, + "loss": 0.9426, + "step": 76920 + }, + { + "epoch": 11.37, + "eval_loss": 0.9065107107162476, + "eval_runtime": 522.6069, + "eval_samples_per_second": 14.617, + "eval_wer": 0.3241373395465851, + "step": 76920 + }, + { + "epoch": 11.38, + "learning_rate": 4.327893175074184e-06, + "loss": 0.9455, + "step": 76960 + }, + { + "epoch": 11.38, + "eval_loss": 0.9122452139854431, + "eval_runtime": 523.7386, + "eval_samples_per_second": 14.586, + "eval_wer": 0.32422310529174647, + "step": 76960 + }, + { + "epoch": 11.38, + "learning_rate": 4.324925816023739e-06, + "loss": 0.9073, + "step": 77000 + }, + { + "epoch": 11.38, + "eval_loss": 0.9343478679656982, + "eval_runtime": 522.2082, + "eval_samples_per_second": 14.628, + "eval_wer": 0.3269104319734698, + "step": 77000 + }, + { + "epoch": 11.39, + "learning_rate": 4.321958456973295e-06, + "loss": 0.9308, + "step": 77040 + }, + { + "epoch": 11.39, + "eval_loss": 0.8989158868789673, + "eval_runtime": 523.7672, + "eval_samples_per_second": 14.585, + "eval_wer": 0.3233368592584122, + "step": 77040 + }, + { + "epoch": 11.39, + "learning_rate": 4.318991097922849e-06, + "loss": 0.9588, + "step": 77080 + }, + { + "epoch": 11.39, + "eval_loss": 0.8802681565284729, + "eval_runtime": 524.0746, + "eval_samples_per_second": 14.576, + "eval_wer": 0.32213613882615283, + "step": 77080 + }, + { + "epoch": 11.4, + "learning_rate": 4.316023738872404e-06, + "loss": 1.0319, + "step": 77120 + }, + { + "epoch": 11.4, + "eval_loss": 0.8505075573921204, + "eval_runtime": 522.9141, + "eval_samples_per_second": 14.609, + "eval_wer": 0.32030646959604336, + "step": 77120 + }, + { + "epoch": 11.41, + "learning_rate": 4.313056379821959e-06, + "loss": 0.9344, + "step": 77160 + }, + { + "epoch": 11.41, + "eval_loss": 0.8615293502807617, + "eval_runtime": 523.2544, + "eval_samples_per_second": 14.599, + "eval_wer": 0.3209354183938935, + "step": 77160 + }, + { + "epoch": 11.41, + "learning_rate": 4.310089020771513e-06, + "loss": 0.9243, + "step": 77200 + }, + { + "epoch": 11.41, + "eval_loss": 0.8459999561309814, + "eval_runtime": 524.1513, + "eval_samples_per_second": 14.574, + "eval_wer": 0.32007776094227963, + "step": 77200 + }, + { + "epoch": 11.42, + "learning_rate": 4.3071216617210685e-06, + "loss": 0.9294, + "step": 77240 + }, + { + "epoch": 11.42, + "eval_loss": 0.8874210715293884, + "eval_runtime": 523.7735, + "eval_samples_per_second": 14.585, + "eval_wer": 0.3231081506046485, + "step": 77240 + }, + { + "epoch": 11.42, + "learning_rate": 4.304154302670624e-06, + "loss": 1.0119, + "step": 77280 + }, + { + "epoch": 11.42, + "eval_loss": 0.8766046166419983, + "eval_runtime": 524.3628, + "eval_samples_per_second": 14.568, + "eval_wer": 0.3217930758455073, + "step": 77280 + }, + { + "epoch": 11.43, + "learning_rate": 4.301186943620178e-06, + "loss": 0.9534, + "step": 77320 + }, + { + "epoch": 11.43, + "eval_loss": 0.8699072599411011, + "eval_runtime": 523.0869, + "eval_samples_per_second": 14.604, + "eval_wer": 0.32030646959604336, + "step": 77320 + }, + { + "epoch": 11.44, + "learning_rate": 4.2982195845697335e-06, + "loss": 1.0033, + "step": 77360 + }, + { + "epoch": 11.44, + "eval_loss": 0.8639472723007202, + "eval_runtime": 523.334, + "eval_samples_per_second": 14.597, + "eval_wer": 0.3199919951971183, + "step": 77360 + }, + { + "epoch": 11.44, + "learning_rate": 4.295252225519288e-06, + "loss": 0.9606, + "step": 77400 + }, + { + "epoch": 11.44, + "eval_loss": 0.8748189806938171, + "eval_runtime": 523.2482, + "eval_samples_per_second": 14.599, + "eval_wer": 0.32122130421109807, + "step": 77400 + }, + { + "epoch": 11.45, + "learning_rate": 4.292284866468843e-06, + "loss": 0.9678, + "step": 77440 + }, + { + "epoch": 11.45, + "eval_loss": 0.8936617970466614, + "eval_runtime": 524.2576, + "eval_samples_per_second": 14.571, + "eval_wer": 0.32350839074873494, + "step": 77440 + }, + { + "epoch": 11.45, + "learning_rate": 4.289317507418398e-06, + "loss": 0.9214, + "step": 77480 + }, + { + "epoch": 11.45, + "eval_loss": 0.8708622455596924, + "eval_runtime": 522.8483, + "eval_samples_per_second": 14.61, + "eval_wer": 0.321278481374539, + "step": 77480 + }, + { + "epoch": 11.46, + "learning_rate": 4.286350148367953e-06, + "loss": 0.9211, + "step": 77520 + }, + { + "epoch": 11.46, + "eval_loss": 0.8749785423278809, + "eval_runtime": 522.694, + "eval_samples_per_second": 14.615, + "eval_wer": 0.320906829812173, + "step": 77520 + }, + { + "epoch": 11.46, + "learning_rate": 4.283382789317508e-06, + "loss": 0.9633, + "step": 77560 + }, + { + "epoch": 11.46, + "eval_loss": 0.87513267993927, + "eval_runtime": 526.6172, + "eval_samples_per_second": 14.506, + "eval_wer": 0.32059235541324793, + "step": 77560 + }, + { + "epoch": 11.47, + "learning_rate": 4.280415430267063e-06, + "loss": 0.9769, + "step": 77600 + }, + { + "epoch": 11.47, + "eval_loss": 0.8771241903305054, + "eval_runtime": 522.5194, + "eval_samples_per_second": 14.62, + "eval_wer": 0.32082106406701166, + "step": 77600 + }, + { + "epoch": 11.48, + "learning_rate": 4.277448071216618e-06, + "loss": 0.989, + "step": 77640 + }, + { + "epoch": 11.48, + "eval_loss": 0.871545672416687, + "eval_runtime": 523.6561, + "eval_samples_per_second": 14.588, + "eval_wer": 0.32027788101432286, + "step": 77640 + }, + { + "epoch": 11.48, + "learning_rate": 4.2744807121661724e-06, + "loss": 0.9697, + "step": 77680 + }, + { + "epoch": 11.48, + "eval_loss": 0.8611247539520264, + "eval_runtime": 524.9941, + "eval_samples_per_second": 14.551, + "eval_wer": 0.3198776408702364, + "step": 77680 + }, + { + "epoch": 11.49, + "learning_rate": 4.271513353115727e-06, + "loss": 0.8575, + "step": 77720 + }, + { + "epoch": 11.49, + "eval_loss": 0.8804584741592407, + "eval_runtime": 523.2061, + "eval_samples_per_second": 14.6, + "eval_wer": 0.32070670974012977, + "step": 77720 + }, + { + "epoch": 11.49, + "learning_rate": 4.268545994065282e-06, + "loss": 0.8743, + "step": 77760 + }, + { + "epoch": 11.49, + "eval_loss": 0.8899778723716736, + "eval_runtime": 524.4697, + "eval_samples_per_second": 14.565, + "eval_wer": 0.320906829812173, + "step": 77760 + }, + { + "epoch": 11.5, + "learning_rate": 4.2655786350148375e-06, + "loss": 0.949, + "step": 77800 + }, + { + "epoch": 11.5, + "eval_loss": 0.8850250244140625, + "eval_runtime": 528.2126, + "eval_samples_per_second": 14.462, + "eval_wer": 0.32102118413905484, + "step": 77800 + }, + { + "epoch": 11.51, + "learning_rate": 4.262611275964392e-06, + "loss": 0.9141, + "step": 77840 + }, + { + "epoch": 11.51, + "eval_loss": 0.8829900622367859, + "eval_runtime": 524.6703, + "eval_samples_per_second": 14.56, + "eval_wer": 0.32059235541324793, + "step": 77840 + }, + { + "epoch": 11.51, + "learning_rate": 4.259643916913947e-06, + "loss": 0.9699, + "step": 77880 + }, + { + "epoch": 11.51, + "eval_loss": 0.8973756432533264, + "eval_runtime": 522.9205, + "eval_samples_per_second": 14.608, + "eval_wer": 0.32213613882615283, + "step": 77880 + }, + { + "epoch": 11.52, + "learning_rate": 4.256676557863502e-06, + "loss": 0.9562, + "step": 77920 + }, + { + "epoch": 11.52, + "eval_loss": 0.8765623569488525, + "eval_runtime": 528.5, + "eval_samples_per_second": 14.454, + "eval_wer": 0.3215929557734641, + "step": 77920 + }, + { + "epoch": 11.52, + "learning_rate": 4.253709198813057e-06, + "loss": 0.9412, + "step": 77960 + }, + { + "epoch": 11.52, + "eval_loss": 0.8962547779083252, + "eval_runtime": 524.3115, + "eval_samples_per_second": 14.57, + "eval_wer": 0.3226221447154007, + "step": 77960 + }, + { + "epoch": 11.53, + "learning_rate": 4.250741839762611e-06, + "loss": 0.9293, + "step": 78000 + }, + { + "epoch": 11.53, + "eval_loss": 0.9454579949378967, + "eval_runtime": 524.5731, + "eval_samples_per_second": 14.562, + "eval_wer": 0.32759655793476083, + "step": 78000 + }, + { + "epoch": 11.54, + "learning_rate": 4.247774480712167e-06, + "loss": 0.9367, + "step": 78040 + }, + { + "epoch": 11.54, + "eval_loss": 0.8851422667503357, + "eval_runtime": 523.0227, + "eval_samples_per_second": 14.605, + "eval_wer": 0.3224506132250779, + "step": 78040 + }, + { + "epoch": 11.54, + "learning_rate": 4.244807121661721e-06, + "loss": 1.0301, + "step": 78080 + }, + { + "epoch": 11.54, + "eval_loss": 0.8933733701705933, + "eval_runtime": 524.0978, + "eval_samples_per_second": 14.576, + "eval_wer": 0.32302238485948714, + "step": 78080 + }, + { + "epoch": 11.55, + "learning_rate": 4.241839762611276e-06, + "loss": 0.9317, + "step": 78120 + }, + { + "epoch": 11.55, + "eval_loss": 0.8730897307395935, + "eval_runtime": 523.4022, + "eval_samples_per_second": 14.595, + "eval_wer": 0.32087824123045255, + "step": 78120 + }, + { + "epoch": 11.55, + "learning_rate": 4.238872403560832e-06, + "loss": 0.9283, + "step": 78160 + }, + { + "epoch": 11.55, + "eval_loss": 0.8756207823753357, + "eval_runtime": 524.9804, + "eval_samples_per_second": 14.551, + "eval_wer": 0.32139283570142085, + "step": 78160 + }, + { + "epoch": 11.56, + "learning_rate": 4.235905044510386e-06, + "loss": 0.9835, + "step": 78200 + }, + { + "epoch": 11.56, + "eval_loss": 0.8877220153808594, + "eval_runtime": 524.494, + "eval_samples_per_second": 14.565, + "eval_wer": 0.3227079104605621, + "step": 78200 + }, + { + "epoch": 11.57, + "learning_rate": 4.2329376854599405e-06, + "loss": 0.9276, + "step": 78240 + }, + { + "epoch": 11.57, + "eval_loss": 0.8919588923454285, + "eval_runtime": 523.5042, + "eval_samples_per_second": 14.592, + "eval_wer": 0.3227079104605621, + "step": 78240 + }, + { + "epoch": 11.57, + "learning_rate": 4.229970326409496e-06, + "loss": 0.9617, + "step": 78280 + }, + { + "epoch": 11.57, + "eval_loss": 0.8707315325737, + "eval_runtime": 523.8542, + "eval_samples_per_second": 14.582, + "eval_wer": 0.321278481374539, + "step": 78280 + }, + { + "epoch": 11.58, + "learning_rate": 4.22700296735905e-06, + "loss": 0.9541, + "step": 78320 + }, + { + "epoch": 11.58, + "eval_loss": 0.9092928171157837, + "eval_runtime": 524.2347, + "eval_samples_per_second": 14.572, + "eval_wer": 0.32396580805626235, + "step": 78320 + }, + { + "epoch": 11.58, + "learning_rate": 4.2240356083086056e-06, + "loss": 0.9654, + "step": 78360 + }, + { + "epoch": 11.58, + "eval_loss": 0.8945013284683228, + "eval_runtime": 523.8633, + "eval_samples_per_second": 14.582, + "eval_wer": 0.3227936762057234, + "step": 78360 + }, + { + "epoch": 11.59, + "learning_rate": 4.221068249258161e-06, + "loss": 0.9632, + "step": 78400 + }, + { + "epoch": 11.59, + "eval_loss": 0.901579737663269, + "eval_runtime": 524.3805, + "eval_samples_per_second": 14.568, + "eval_wer": 0.32345121358529405, + "step": 78400 + }, + { + "epoch": 11.59, + "learning_rate": 4.218100890207715e-06, + "loss": 0.9379, + "step": 78440 + }, + { + "epoch": 11.59, + "eval_loss": 0.8847746849060059, + "eval_runtime": 523.4166, + "eval_samples_per_second": 14.594, + "eval_wer": 0.32173589868206637, + "step": 78440 + }, + { + "epoch": 11.6, + "learning_rate": 4.215133531157271e-06, + "loss": 0.9561, + "step": 78480 + }, + { + "epoch": 11.6, + "eval_loss": 0.8811178803443909, + "eval_runtime": 524.5003, + "eval_samples_per_second": 14.564, + "eval_wer": 0.3217930758455073, + "step": 78480 + }, + { + "epoch": 11.61, + "learning_rate": 4.212166172106825e-06, + "loss": 0.9463, + "step": 78520 + }, + { + "epoch": 11.61, + "eval_loss": 0.8614893555641174, + "eval_runtime": 524.5689, + "eval_samples_per_second": 14.562, + "eval_wer": 0.32007776094227963, + "step": 78520 + }, + { + "epoch": 11.61, + "learning_rate": 4.2091988130563795e-06, + "loss": 0.906, + "step": 78560 + }, + { + "epoch": 11.61, + "eval_loss": 0.8711714148521423, + "eval_runtime": 523.2597, + "eval_samples_per_second": 14.599, + "eval_wer": 0.32030646959604336, + "step": 78560 + }, + { + "epoch": 11.62, + "learning_rate": 4.206231454005935e-06, + "loss": 0.9266, + "step": 78600 + }, + { + "epoch": 11.62, + "eval_loss": 0.8591979146003723, + "eval_runtime": 524.6556, + "eval_samples_per_second": 14.56, + "eval_wer": 0.31979187512507506, + "step": 78600 + }, + { + "epoch": 11.62, + "learning_rate": 4.20326409495549e-06, + "loss": 0.9511, + "step": 78640 + }, + { + "epoch": 11.62, + "eval_loss": 0.8643084764480591, + "eval_runtime": 525.1113, + "eval_samples_per_second": 14.547, + "eval_wer": 0.32002058377883874, + "step": 78640 + }, + { + "epoch": 11.63, + "learning_rate": 4.200296735905045e-06, + "loss": 1.0736, + "step": 78680 + }, + { + "epoch": 11.63, + "eval_loss": 0.8239288330078125, + "eval_runtime": 523.1442, + "eval_samples_per_second": 14.602, + "eval_wer": 0.3181909145487292, + "step": 78680 + }, + { + "epoch": 11.64, + "learning_rate": 4.1973293768546e-06, + "loss": 0.9225, + "step": 78720 + }, + { + "epoch": 11.64, + "eval_loss": 0.8282068371772766, + "eval_runtime": 523.7728, + "eval_samples_per_second": 14.585, + "eval_wer": 0.31781926298636326, + "step": 78720 + }, + { + "epoch": 11.64, + "learning_rate": 4.194362017804154e-06, + "loss": 0.9785, + "step": 78760 + }, + { + "epoch": 11.64, + "eval_loss": 0.8568938970565796, + "eval_runtime": 523.0885, + "eval_samples_per_second": 14.604, + "eval_wer": 0.3195345778895909, + "step": 78760 + }, + { + "epoch": 11.65, + "learning_rate": 4.1913946587537095e-06, + "loss": 0.949, + "step": 78800 + }, + { + "epoch": 11.65, + "eval_loss": 0.8848423361778259, + "eval_runtime": 523.5804, + "eval_samples_per_second": 14.59, + "eval_wer": 0.3209354183938935, + "step": 78800 + }, + { + "epoch": 11.65, + "learning_rate": 4.188427299703264e-06, + "loss": 0.9895, + "step": 78840 + }, + { + "epoch": 11.65, + "eval_loss": 0.8649215698242188, + "eval_runtime": 525.3482, + "eval_samples_per_second": 14.541, + "eval_wer": 0.3201349381057206, + "step": 78840 + }, + { + "epoch": 11.66, + "learning_rate": 4.185459940652819e-06, + "loss": 0.9405, + "step": 78880 + }, + { + "epoch": 11.66, + "eval_loss": 0.8436762094497681, + "eval_runtime": 523.8042, + "eval_samples_per_second": 14.584, + "eval_wer": 0.31839103462077245, + "step": 78880 + }, + { + "epoch": 11.67, + "learning_rate": 4.1824925816023745e-06, + "loss": 0.9537, + "step": 78920 + }, + { + "epoch": 11.67, + "eval_loss": 0.8738733530044556, + "eval_runtime": 524.4679, + "eval_samples_per_second": 14.565, + "eval_wer": 0.32096400697561395, + "step": 78920 + }, + { + "epoch": 11.67, + "learning_rate": 4.179525222551929e-06, + "loss": 0.9896, + "step": 78960 + }, + { + "epoch": 11.67, + "eval_loss": 0.8520752787590027, + "eval_runtime": 526.1636, + "eval_samples_per_second": 14.518, + "eval_wer": 0.31936304639926816, + "step": 78960 + }, + { + "epoch": 11.68, + "learning_rate": 4.176557863501484e-06, + "loss": 0.9161, + "step": 79000 + }, + { + "epoch": 11.68, + "eval_loss": 0.9059736132621765, + "eval_runtime": 525.2929, + "eval_samples_per_second": 14.542, + "eval_wer": 0.3232510935132508, + "step": 79000 + }, + { + "epoch": 11.68, + "learning_rate": 4.173590504451039e-06, + "loss": 1.0051, + "step": 79040 + }, + { + "epoch": 11.68, + "eval_loss": 0.8351567983627319, + "eval_runtime": 524.8517, + "eval_samples_per_second": 14.555, + "eval_wer": 0.3181909145487292, + "step": 79040 + }, + { + "epoch": 11.69, + "learning_rate": 4.170623145400593e-06, + "loss": 0.952, + "step": 79080 + }, + { + "epoch": 11.69, + "eval_loss": 0.8897086381912231, + "eval_runtime": 524.2932, + "eval_samples_per_second": 14.57, + "eval_wer": 0.32176448726378687, + "step": 79080 + }, + { + "epoch": 11.7, + "learning_rate": 4.1676557863501484e-06, + "loss": 0.8746, + "step": 79120 + }, + { + "epoch": 11.7, + "eval_loss": 0.8790468573570251, + "eval_runtime": 523.4436, + "eval_samples_per_second": 14.594, + "eval_wer": 0.32070670974012977, + "step": 79120 + }, + { + "epoch": 11.7, + "learning_rate": 4.164688427299704e-06, + "loss": 0.9755, + "step": 79160 + }, + { + "epoch": 11.7, + "eval_loss": 0.9040760397911072, + "eval_runtime": 524.9438, + "eval_samples_per_second": 14.552, + "eval_wer": 0.32276508762400297, + "step": 79160 + }, + { + "epoch": 11.71, + "learning_rate": 4.161721068249259e-06, + "loss": 1.0606, + "step": 79200 + }, + { + "epoch": 11.71, + "eval_loss": 0.8644907474517822, + "eval_runtime": 524.5851, + "eval_samples_per_second": 14.562, + "eval_wer": 0.3193058692358272, + "step": 79200 + }, + { + "epoch": 11.71, + "learning_rate": 4.1587537091988135e-06, + "loss": 0.8988, + "step": 79240 + }, + { + "epoch": 11.71, + "eval_loss": 0.8876854777336121, + "eval_runtime": 524.446, + "eval_samples_per_second": 14.566, + "eval_wer": 0.32062094399496843, + "step": 79240 + }, + { + "epoch": 11.72, + "learning_rate": 4.155786350148368e-06, + "loss": 0.9494, + "step": 79280 + }, + { + "epoch": 11.72, + "eval_loss": 0.8644449710845947, + "eval_runtime": 524.7641, + "eval_samples_per_second": 14.557, + "eval_wer": 0.3199062294519569, + "step": 79280 + }, + { + "epoch": 11.72, + "learning_rate": 4.152818991097923e-06, + "loss": 0.9646, + "step": 79320 + }, + { + "epoch": 11.72, + "eval_loss": 0.8757545351982117, + "eval_runtime": 524.2592, + "eval_samples_per_second": 14.571, + "eval_wer": 0.3204780010863661, + "step": 79320 + }, + { + "epoch": 11.73, + "learning_rate": 4.149851632047478e-06, + "loss": 0.921, + "step": 79360 + }, + { + "epoch": 11.73, + "eval_loss": 0.9016876816749573, + "eval_runtime": 527.8715, + "eval_samples_per_second": 14.471, + "eval_wer": 0.322393436061637, + "step": 79360 + }, + { + "epoch": 11.74, + "learning_rate": 4.146884272997033e-06, + "loss": 1.0013, + "step": 79400 + }, + { + "epoch": 11.74, + "eval_loss": 0.8564038276672363, + "eval_runtime": 524.8761, + "eval_samples_per_second": 14.554, + "eval_wer": 0.31936304639926816, + "step": 79400 + }, + { + "epoch": 11.74, + "learning_rate": 4.143916913946588e-06, + "loss": 0.9219, + "step": 79440 + }, + { + "epoch": 11.74, + "eval_loss": 0.8412842154502869, + "eval_runtime": 524.4637, + "eval_samples_per_second": 14.565, + "eval_wer": 0.31824809171217017, + "step": 79440 + }, + { + "epoch": 11.75, + "learning_rate": 4.140949554896143e-06, + "loss": 0.9048, + "step": 79480 + }, + { + "epoch": 11.75, + "eval_loss": 0.9077873229980469, + "eval_runtime": 523.8135, + "eval_samples_per_second": 14.583, + "eval_wer": 0.3236513336573373, + "step": 79480 + }, + { + "epoch": 11.75, + "learning_rate": 4.137982195845698e-06, + "loss": 0.978, + "step": 79520 + }, + { + "epoch": 11.75, + "eval_loss": 0.9030499458312988, + "eval_runtime": 523.5486, + "eval_samples_per_second": 14.591, + "eval_wer": 0.3233940364218531, + "step": 79520 + }, + { + "epoch": 11.76, + "learning_rate": 4.135014836795252e-06, + "loss": 1.0114, + "step": 79560 + }, + { + "epoch": 11.76, + "eval_loss": 0.8320261836051941, + "eval_runtime": 523.2138, + "eval_samples_per_second": 14.6, + "eval_wer": 0.3180765602218474, + "step": 79560 + }, + { + "epoch": 11.77, + "learning_rate": 4.132047477744807e-06, + "loss": 0.9727, + "step": 79600 + }, + { + "epoch": 11.77, + "eval_loss": 0.8364858031272888, + "eval_runtime": 524.3394, + "eval_samples_per_second": 14.569, + "eval_wer": 0.3187055090196975, + "step": 79600 + }, + { + "epoch": 11.77, + "learning_rate": 4.129080118694362e-06, + "loss": 0.9462, + "step": 79640 + }, + { + "epoch": 11.77, + "eval_loss": 0.8415073156356812, + "eval_runtime": 525.989, + "eval_samples_per_second": 14.523, + "eval_wer": 0.31876268618313847, + "step": 79640 + }, + { + "epoch": 11.78, + "learning_rate": 4.126112759643917e-06, + "loss": 0.8851, + "step": 79680 + }, + { + "epoch": 11.78, + "eval_loss": 0.8824367523193359, + "eval_runtime": 529.0318, + "eval_samples_per_second": 14.44, + "eval_wer": 0.3209354183938935, + "step": 79680 + }, + { + "epoch": 11.78, + "learning_rate": 4.123145400593473e-06, + "loss": 1.0052, + "step": 79720 + }, + { + "epoch": 11.78, + "eval_loss": 0.8799766302108765, + "eval_runtime": 523.98, + "eval_samples_per_second": 14.579, + "eval_wer": 0.3199919951971183, + "step": 79720 + }, + { + "epoch": 11.79, + "learning_rate": 4.120178041543027e-06, + "loss": 1.0178, + "step": 79760 + }, + { + "epoch": 11.79, + "eval_loss": 0.8128865361213684, + "eval_runtime": 524.0969, + "eval_samples_per_second": 14.576, + "eval_wer": 0.315818062265931, + "step": 79760 + }, + { + "epoch": 11.8, + "learning_rate": 4.1172106824925816e-06, + "loss": 1.0587, + "step": 79800 + }, + { + "epoch": 11.8, + "eval_loss": 0.8359128832817078, + "eval_runtime": 523.2726, + "eval_samples_per_second": 14.599, + "eval_wer": 0.31736184567883585, + "step": 79800 + }, + { + "epoch": 11.8, + "learning_rate": 4.114243323442137e-06, + "loss": 0.8742, + "step": 79840 + }, + { + "epoch": 11.8, + "eval_loss": 0.8834995627403259, + "eval_runtime": 524.657, + "eval_samples_per_second": 14.56, + "eval_wer": 0.3200491723605592, + "step": 79840 + }, + { + "epoch": 11.81, + "learning_rate": 4.111275964391691e-06, + "loss": 0.9656, + "step": 79880 + }, + { + "epoch": 11.81, + "eval_loss": 0.8848907351493835, + "eval_runtime": 524.3395, + "eval_samples_per_second": 14.569, + "eval_wer": 0.31947740072615, + "step": 79880 + }, + { + "epoch": 11.81, + "learning_rate": 4.108308605341247e-06, + "loss": 0.9574, + "step": 79920 + }, + { + "epoch": 11.81, + "eval_loss": 0.8596533536911011, + "eval_runtime": 524.8686, + "eval_samples_per_second": 14.554, + "eval_wer": 0.3180765602218474, + "step": 79920 + }, + { + "epoch": 11.82, + "learning_rate": 4.105341246290802e-06, + "loss": 0.9563, + "step": 79960 + }, + { + "epoch": 11.82, + "eval_loss": 0.8504166603088379, + "eval_runtime": 525.2001, + "eval_samples_per_second": 14.545, + "eval_wer": 0.3180765602218474, + "step": 79960 + }, + { + "epoch": 11.83, + "learning_rate": 4.102373887240356e-06, + "loss": 0.961, + "step": 80000 + }, + { + "epoch": 11.83, + "eval_loss": 0.8558455109596252, + "eval_runtime": 523.5012, + "eval_samples_per_second": 14.592, + "eval_wer": 0.3179336173132451, + "step": 80000 + }, + { + "epoch": 11.83, + "learning_rate": 4.099406528189912e-06, + "loss": 0.9862, + "step": 80040 + }, + { + "epoch": 11.83, + "eval_loss": 0.8296683430671692, + "eval_runtime": 523.5091, + "eval_samples_per_second": 14.592, + "eval_wer": 0.3167614854627062, + "step": 80040 + }, + { + "epoch": 11.84, + "learning_rate": 4.096439169139466e-06, + "loss": 0.8801, + "step": 80080 + }, + { + "epoch": 11.84, + "eval_loss": 0.8556073307991028, + "eval_runtime": 526.4711, + "eval_samples_per_second": 14.51, + "eval_wer": 0.317990794476686, + "step": 80080 + }, + { + "epoch": 11.84, + "learning_rate": 4.0934718100890205e-06, + "loss": 0.9325, + "step": 80120 + }, + { + "epoch": 11.84, + "eval_loss": 0.8555437922477722, + "eval_runtime": 523.4527, + "eval_samples_per_second": 14.593, + "eval_wer": 0.31824809171217017, + "step": 80120 + }, + { + "epoch": 11.85, + "learning_rate": 4.090504451038576e-06, + "loss": 0.8948, + "step": 80160 + }, + { + "epoch": 11.85, + "eval_loss": 0.891800582408905, + "eval_runtime": 526.8176, + "eval_samples_per_second": 14.5, + "eval_wer": 0.320906829812173, + "step": 80160 + }, + { + "epoch": 11.86, + "learning_rate": 4.087537091988131e-06, + "loss": 0.9754, + "step": 80200 + }, + { + "epoch": 11.86, + "eval_loss": 0.8781245946884155, + "eval_runtime": 524.2642, + "eval_samples_per_second": 14.571, + "eval_wer": 0.31950598930787044, + "step": 80200 + }, + { + "epoch": 11.86, + "learning_rate": 4.084569732937686e-06, + "loss": 0.9984, + "step": 80240 + }, + { + "epoch": 11.86, + "eval_loss": 0.8363027572631836, + "eval_runtime": 524.2066, + "eval_samples_per_second": 14.572, + "eval_wer": 0.3182766802938906, + "step": 80240 + }, + { + "epoch": 11.87, + "learning_rate": 4.081602373887241e-06, + "loss": 0.9091, + "step": 80280 + }, + { + "epoch": 11.87, + "eval_loss": 0.8503888249397278, + "eval_runtime": 523.674, + "eval_samples_per_second": 14.587, + "eval_wer": 0.31864833185625663, + "step": 80280 + }, + { + "epoch": 11.87, + "learning_rate": 4.078635014836795e-06, + "loss": 0.9245, + "step": 80320 + }, + { + "epoch": 11.87, + "eval_loss": 0.8640632629394531, + "eval_runtime": 523.6197, + "eval_samples_per_second": 14.589, + "eval_wer": 0.31907716058206353, + "step": 80320 + }, + { + "epoch": 11.88, + "learning_rate": 4.0756676557863505e-06, + "loss": 0.9406, + "step": 80360 + }, + { + "epoch": 11.88, + "eval_loss": 0.8686935901641846, + "eval_runtime": 524.3527, + "eval_samples_per_second": 14.568, + "eval_wer": 0.3196489322164727, + "step": 80360 + }, + { + "epoch": 11.88, + "learning_rate": 4.072700296735905e-06, + "loss": 0.9242, + "step": 80400 + }, + { + "epoch": 11.88, + "eval_loss": 0.872299313545227, + "eval_runtime": 523.8128, + "eval_samples_per_second": 14.583, + "eval_wer": 0.320163526687441, + "step": 80400 + }, + { + "epoch": 11.89, + "learning_rate": 4.06973293768546e-06, + "loss": 0.9274, + "step": 80440 + }, + { + "epoch": 11.89, + "eval_loss": 0.8660278916358948, + "eval_runtime": 523.2636, + "eval_samples_per_second": 14.599, + "eval_wer": 0.32036364675948426, + "step": 80440 + }, + { + "epoch": 11.9, + "learning_rate": 4.0667655786350156e-06, + "loss": 0.9333, + "step": 80480 + }, + { + "epoch": 11.9, + "eval_loss": 0.8493769764900208, + "eval_runtime": 524.4152, + "eval_samples_per_second": 14.567, + "eval_wer": 0.3191915149089454, + "step": 80480 + }, + { + "epoch": 11.9, + "learning_rate": 4.06379821958457e-06, + "loss": 0.916, + "step": 80520 + }, + { + "epoch": 11.9, + "eval_loss": 0.8417730331420898, + "eval_runtime": 522.6634, + "eval_samples_per_second": 14.616, + "eval_wer": 0.31833385745733156, + "step": 80520 + }, + { + "epoch": 11.91, + "learning_rate": 4.060830860534125e-06, + "loss": 1.1075, + "step": 80560 + }, + { + "epoch": 11.91, + "eval_loss": 0.8455369472503662, + "eval_runtime": 522.9521, + "eval_samples_per_second": 14.607, + "eval_wer": 0.31847680036593384, + "step": 80560 + }, + { + "epoch": 11.91, + "learning_rate": 4.05786350148368e-06, + "loss": 0.9976, + "step": 80600 + }, + { + "epoch": 11.91, + "eval_loss": 0.8404129147529602, + "eval_runtime": 522.2816, + "eval_samples_per_second": 14.626, + "eval_wer": 0.31796220589496554, + "step": 80600 + }, + { + "epoch": 11.92, + "learning_rate": 4.054896142433234e-06, + "loss": 0.9124, + "step": 80640 + }, + { + "epoch": 11.92, + "eval_loss": 0.8666889071464539, + "eval_runtime": 522.9242, + "eval_samples_per_second": 14.608, + "eval_wer": 0.3198776408702364, + "step": 80640 + }, + { + "epoch": 11.93, + "learning_rate": 4.0519287833827895e-06, + "loss": 1.0873, + "step": 80680 + }, + { + "epoch": 11.93, + "eval_loss": 0.866253137588501, + "eval_runtime": 523.8556, + "eval_samples_per_second": 14.582, + "eval_wer": 0.31936304639926816, + "step": 80680 + }, + { + "epoch": 11.93, + "learning_rate": 4.048961424332345e-06, + "loss": 0.9649, + "step": 80720 + }, + { + "epoch": 11.93, + "eval_loss": 0.8646376132965088, + "eval_runtime": 523.0255, + "eval_samples_per_second": 14.605, + "eval_wer": 0.31979187512507506, + "step": 80720 + }, + { + "epoch": 11.94, + "learning_rate": 4.0459940652819e-06, + "loss": 0.9728, + "step": 80760 + }, + { + "epoch": 11.94, + "eval_loss": 0.8401035070419312, + "eval_runtime": 522.817, + "eval_samples_per_second": 14.611, + "eval_wer": 0.31796220589496554, + "step": 80760 + }, + { + "epoch": 11.94, + "learning_rate": 4.0430267062314545e-06, + "loss": 0.9577, + "step": 80800 + }, + { + "epoch": 11.94, + "eval_loss": 0.8614905476570129, + "eval_runtime": 523.6553, + "eval_samples_per_second": 14.588, + "eval_wer": 0.31907716058206353, + "step": 80800 + }, + { + "epoch": 11.95, + "learning_rate": 4.040059347181009e-06, + "loss": 1.0003, + "step": 80840 + }, + { + "epoch": 11.95, + "eval_loss": 0.8492382764816284, + "eval_runtime": 525.1191, + "eval_samples_per_second": 14.547, + "eval_wer": 0.3187055090196975, + "step": 80840 + }, + { + "epoch": 11.96, + "learning_rate": 4.037091988130564e-06, + "loss": 0.9137, + "step": 80880 + }, + { + "epoch": 11.96, + "eval_loss": 0.8892574310302734, + "eval_runtime": 523.2111, + "eval_samples_per_second": 14.6, + "eval_wer": 0.3206495325766889, + "step": 80880 + }, + { + "epoch": 11.96, + "learning_rate": 4.034124629080119e-06, + "loss": 0.8336, + "step": 80920 + }, + { + "epoch": 11.96, + "eval_loss": 0.9157854914665222, + "eval_runtime": 524.3861, + "eval_samples_per_second": 14.568, + "eval_wer": 0.32353697933045544, + "step": 80920 + }, + { + "epoch": 11.97, + "learning_rate": 4.031157270029674e-06, + "loss": 0.9144, + "step": 80960 + }, + { + "epoch": 11.97, + "eval_loss": 0.8712791204452515, + "eval_runtime": 525.5192, + "eval_samples_per_second": 14.536, + "eval_wer": 0.3199919951971183, + "step": 80960 + }, + { + "epoch": 11.97, + "learning_rate": 4.028189910979229e-06, + "loss": 0.936, + "step": 81000 + }, + { + "epoch": 11.97, + "eval_loss": 0.8820872902870178, + "eval_runtime": 525.2995, + "eval_samples_per_second": 14.542, + "eval_wer": 0.3206781211584093, + "step": 81000 + }, + { + "epoch": 11.98, + "learning_rate": 4.025222551928784e-06, + "loss": 0.939, + "step": 81040 + }, + { + "epoch": 11.98, + "eval_loss": 0.8810380101203918, + "eval_runtime": 523.0552, + "eval_samples_per_second": 14.605, + "eval_wer": 0.32036364675948426, + "step": 81040 + }, + { + "epoch": 11.99, + "learning_rate": 4.022255192878339e-06, + "loss": 0.9862, + "step": 81080 + }, + { + "epoch": 11.99, + "eval_loss": 0.8338649272918701, + "eval_runtime": 523.5922, + "eval_samples_per_second": 14.59, + "eval_wer": 0.317990794476686, + "step": 81080 + }, + { + "epoch": 11.99, + "learning_rate": 4.019287833827893e-06, + "loss": 0.95, + "step": 81120 + }, + { + "epoch": 11.99, + "eval_loss": 0.8525464534759521, + "eval_runtime": 523.1374, + "eval_samples_per_second": 14.602, + "eval_wer": 0.31839103462077245, + "step": 81120 + }, + { + "epoch": 12.0, + "learning_rate": 4.016320474777448e-06, + "loss": 0.9934, + "step": 81160 + }, + { + "epoch": 12.0, + "eval_loss": 0.8421252369880676, + "eval_runtime": 522.3005, + "eval_samples_per_second": 14.626, + "eval_wer": 0.3181909145487292, + "step": 81160 + }, + { + "epoch": 12.0, + "learning_rate": 4.013353115727003e-06, + "loss": 0.9557, + "step": 81200 + }, + { + "epoch": 12.0, + "eval_loss": 0.8127682209014893, + "eval_runtime": 521.8058, + "eval_samples_per_second": 14.64, + "eval_wer": 0.31590382801109235, + "step": 81200 + }, + { + "epoch": 12.01, + "learning_rate": 4.0103857566765584e-06, + "loss": 0.9445, + "step": 81240 + }, + { + "epoch": 12.01, + "eval_loss": 0.8823168873786926, + "eval_runtime": 523.382, + "eval_samples_per_second": 14.595, + "eval_wer": 0.32053517824980704, + "step": 81240 + }, + { + "epoch": 12.01, + "learning_rate": 4.007418397626113e-06, + "loss": 0.926, + "step": 81280 + }, + { + "epoch": 12.01, + "eval_loss": 0.8604192733764648, + "eval_runtime": 523.7119, + "eval_samples_per_second": 14.586, + "eval_wer": 0.319105749163784, + "step": 81280 + }, + { + "epoch": 12.02, + "learning_rate": 4.004451038575668e-06, + "loss": 0.9617, + "step": 81320 + }, + { + "epoch": 12.02, + "eval_loss": 0.8644814491271973, + "eval_runtime": 523.5727, + "eval_samples_per_second": 14.59, + "eval_wer": 0.31942022356270905, + "step": 81320 + }, + { + "epoch": 12.03, + "learning_rate": 4.001483679525223e-06, + "loss": 0.9855, + "step": 81360 + }, + { + "epoch": 12.03, + "eval_loss": 0.8658839464187622, + "eval_runtime": 523.7875, + "eval_samples_per_second": 14.584, + "eval_wer": 0.31924869207238626, + "step": 81360 + }, + { + "epoch": 12.03, + "learning_rate": 3.998516320474778e-06, + "loss": 0.9127, + "step": 81400 + }, + { + "epoch": 12.03, + "eval_loss": 0.862577497959137, + "eval_runtime": 530.1416, + "eval_samples_per_second": 14.409, + "eval_wer": 0.31924869207238626, + "step": 81400 + }, + { + "epoch": 12.04, + "learning_rate": 3.995548961424332e-06, + "loss": 0.9151, + "step": 81440 + }, + { + "epoch": 12.04, + "eval_loss": 0.8566737174987793, + "eval_runtime": 526.4018, + "eval_samples_per_second": 14.512, + "eval_wer": 0.31890562909174075, + "step": 81440 + }, + { + "epoch": 12.04, + "learning_rate": 3.992581602373888e-06, + "loss": 0.9916, + "step": 81480 + }, + { + "epoch": 12.04, + "eval_loss": 0.8344435095787048, + "eval_runtime": 525.466, + "eval_samples_per_second": 14.538, + "eval_wer": 0.3171331370250722, + "step": 81480 + }, + { + "epoch": 12.05, + "learning_rate": 3.989614243323443e-06, + "loss": 0.9265, + "step": 81520 + }, + { + "epoch": 12.05, + "eval_loss": 0.8394008278846741, + "eval_runtime": 525.0292, + "eval_samples_per_second": 14.55, + "eval_wer": 0.317990794476686, + "step": 81520 + }, + { + "epoch": 12.06, + "learning_rate": 3.986646884272997e-06, + "loss": 0.8672, + "step": 81560 + }, + { + "epoch": 12.06, + "eval_loss": 0.8704163432121277, + "eval_runtime": 524.4648, + "eval_samples_per_second": 14.565, + "eval_wer": 0.31959175505303183, + "step": 81560 + }, + { + "epoch": 12.06, + "learning_rate": 3.983679525222553e-06, + "loss": 1.0207, + "step": 81600 + }, + { + "epoch": 12.06, + "eval_loss": 0.8463544845581055, + "eval_runtime": 523.9294, + "eval_samples_per_second": 14.58, + "eval_wer": 0.3182766802938906, + "step": 81600 + }, + { + "epoch": 12.07, + "learning_rate": 3.980712166172107e-06, + "loss": 1.0017, + "step": 81640 + }, + { + "epoch": 12.07, + "eval_loss": 0.8295923471450806, + "eval_runtime": 525.5692, + "eval_samples_per_second": 14.535, + "eval_wer": 0.3177049086594814, + "step": 81640 + }, + { + "epoch": 12.07, + "learning_rate": 3.9777448071216615e-06, + "loss": 1.0134, + "step": 81680 + }, + { + "epoch": 12.07, + "eval_loss": 0.8416734933853149, + "eval_runtime": 524.228, + "eval_samples_per_second": 14.572, + "eval_wer": 0.3185339775293748, + "step": 81680 + }, + { + "epoch": 12.08, + "learning_rate": 3.974777448071217e-06, + "loss": 1.0137, + "step": 81720 + }, + { + "epoch": 12.08, + "eval_loss": 0.8600002527236938, + "eval_runtime": 524.9138, + "eval_samples_per_second": 14.553, + "eval_wer": 0.31881986334657936, + "step": 81720 + }, + { + "epoch": 12.09, + "learning_rate": 3.971810089020772e-06, + "loss": 0.9356, + "step": 81760 + }, + { + "epoch": 12.09, + "eval_loss": 0.8794257044792175, + "eval_runtime": 524.9097, + "eval_samples_per_second": 14.553, + "eval_wer": 0.3199919951971183, + "step": 81760 + }, + { + "epoch": 12.09, + "learning_rate": 3.9688427299703265e-06, + "loss": 0.9983, + "step": 81800 + }, + { + "epoch": 12.09, + "eval_loss": 0.8798732161521912, + "eval_runtime": 526.0733, + "eval_samples_per_second": 14.521, + "eval_wer": 0.31979187512507506, + "step": 81800 + }, + { + "epoch": 12.1, + "learning_rate": 3.965875370919882e-06, + "loss": 1.0844, + "step": 81840 + }, + { + "epoch": 12.1, + "eval_loss": 0.8300412893295288, + "eval_runtime": 524.3634, + "eval_samples_per_second": 14.568, + "eval_wer": 0.31796220589496554, + "step": 81840 + }, + { + "epoch": 12.1, + "learning_rate": 3.962908011869436e-06, + "loss": 0.894, + "step": 81880 + }, + { + "epoch": 12.1, + "eval_loss": 0.8704379796981812, + "eval_runtime": 524.1434, + "eval_samples_per_second": 14.574, + "eval_wer": 0.31956316647131133, + "step": 81880 + }, + { + "epoch": 12.11, + "learning_rate": 3.9599406528189916e-06, + "loss": 0.9677, + "step": 81920 + }, + { + "epoch": 12.11, + "eval_loss": 0.8411785364151001, + "eval_runtime": 523.6818, + "eval_samples_per_second": 14.587, + "eval_wer": 0.31839103462077245, + "step": 81920 + }, + { + "epoch": 12.12, + "learning_rate": 3.956973293768546e-06, + "loss": 0.9266, + "step": 81960 + }, + { + "epoch": 12.12, + "eval_loss": 0.8312793374061584, + "eval_runtime": 524.9319, + "eval_samples_per_second": 14.552, + "eval_wer": 0.3173332570971154, + "step": 81960 + }, + { + "epoch": 12.12, + "learning_rate": 3.954005934718101e-06, + "loss": 0.9367, + "step": 82000 + }, + { + "epoch": 12.12, + "eval_loss": 0.8514599800109863, + "eval_runtime": 523.8406, + "eval_samples_per_second": 14.583, + "eval_wer": 0.31876268618313847, + "step": 82000 + }, + { + "epoch": 12.13, + "learning_rate": 3.951038575667656e-06, + "loss": 0.9478, + "step": 82040 + }, + { + "epoch": 12.13, + "eval_loss": 0.842492938041687, + "eval_runtime": 525.6952, + "eval_samples_per_second": 14.531, + "eval_wer": 0.3176763200777609, + "step": 82040 + }, + { + "epoch": 12.13, + "learning_rate": 3.948071216617211e-06, + "loss": 0.9033, + "step": 82080 + }, + { + "epoch": 12.13, + "eval_loss": 0.8509601354598999, + "eval_runtime": 525.5831, + "eval_samples_per_second": 14.534, + "eval_wer": 0.3181909145487292, + "step": 82080 + }, + { + "epoch": 12.14, + "learning_rate": 3.945103857566766e-06, + "loss": 0.9046, + "step": 82120 + }, + { + "epoch": 12.14, + "eval_loss": 0.8761820197105408, + "eval_runtime": 528.9499, + "eval_samples_per_second": 14.442, + "eval_wer": 0.3199919951971183, + "step": 82120 + }, + { + "epoch": 12.14, + "learning_rate": 3.942136498516321e-06, + "loss": 0.9361, + "step": 82160 + }, + { + "epoch": 12.14, + "eval_loss": 0.8794522285461426, + "eval_runtime": 524.4344, + "eval_samples_per_second": 14.566, + "eval_wer": 0.320163526687441, + "step": 82160 + }, + { + "epoch": 12.15, + "learning_rate": 3.939169139465875e-06, + "loss": 0.8959, + "step": 82200 + }, + { + "epoch": 12.15, + "eval_loss": 0.8670927882194519, + "eval_runtime": 524.5051, + "eval_samples_per_second": 14.564, + "eval_wer": 0.31936304639926816, + "step": 82200 + }, + { + "epoch": 12.16, + "learning_rate": 3.9362017804154305e-06, + "loss": 0.9456, + "step": 82240 + }, + { + "epoch": 12.16, + "eval_loss": 0.8616918325424194, + "eval_runtime": 525.6548, + "eval_samples_per_second": 14.532, + "eval_wer": 0.31830526887561106, + "step": 82240 + }, + { + "epoch": 12.16, + "learning_rate": 3.933234421364985e-06, + "loss": 0.9474, + "step": 82280 + }, + { + "epoch": 12.16, + "eval_loss": 0.836297869682312, + "eval_runtime": 526.5157, + "eval_samples_per_second": 14.509, + "eval_wer": 0.31636124531861975, + "step": 82280 + }, + { + "epoch": 12.17, + "learning_rate": 3.93026706231454e-06, + "loss": 0.9871, + "step": 82320 + }, + { + "epoch": 12.17, + "eval_loss": 0.8510875105857849, + "eval_runtime": 524.7113, + "eval_samples_per_second": 14.558, + "eval_wer": 0.31761914291432003, + "step": 82320 + }, + { + "epoch": 12.17, + "learning_rate": 3.9272997032640955e-06, + "loss": 0.9386, + "step": 82360 + }, + { + "epoch": 12.17, + "eval_loss": 0.8552115559577942, + "eval_runtime": 525.1912, + "eval_samples_per_second": 14.545, + "eval_wer": 0.31730466851539496, + "step": 82360 + }, + { + "epoch": 12.18, + "learning_rate": 3.92433234421365e-06, + "loss": 0.8224, + "step": 82400 + }, + { + "epoch": 12.18, + "eval_loss": 0.9090474843978882, + "eval_runtime": 525.6144, + "eval_samples_per_second": 14.533, + "eval_wer": 0.3214500128648618, + "step": 82400 + }, + { + "epoch": 12.19, + "learning_rate": 3.921364985163205e-06, + "loss": 0.9441, + "step": 82440 + }, + { + "epoch": 12.19, + "eval_loss": 0.8947290182113647, + "eval_runtime": 524.4844, + "eval_samples_per_second": 14.565, + "eval_wer": 0.32027788101432286, + "step": 82440 + }, + { + "epoch": 12.19, + "learning_rate": 3.91839762611276e-06, + "loss": 0.9437, + "step": 82480 + }, + { + "epoch": 12.19, + "eval_loss": 0.8780737519264221, + "eval_runtime": 525.5659, + "eval_samples_per_second": 14.535, + "eval_wer": 0.3182195031304497, + "step": 82480 + }, + { + "epoch": 12.2, + "learning_rate": 3.915430267062315e-06, + "loss": 0.976, + "step": 82520 + }, + { + "epoch": 12.2, + "eval_loss": 0.8858648538589478, + "eval_runtime": 524.9287, + "eval_samples_per_second": 14.552, + "eval_wer": 0.31927728065410677, + "step": 82520 + }, + { + "epoch": 12.2, + "learning_rate": 3.912462908011869e-06, + "loss": 0.9769, + "step": 82560 + }, + { + "epoch": 12.2, + "eval_loss": 0.8566499352455139, + "eval_runtime": 526.5462, + "eval_samples_per_second": 14.508, + "eval_wer": 0.31684725120786755, + "step": 82560 + }, + { + "epoch": 12.21, + "learning_rate": 3.909495548961425e-06, + "loss": 0.9815, + "step": 82600 + }, + { + "epoch": 12.21, + "eval_loss": 0.8553969860076904, + "eval_runtime": 525.3069, + "eval_samples_per_second": 14.542, + "eval_wer": 0.3170473712799108, + "step": 82600 + }, + { + "epoch": 12.22, + "learning_rate": 3.90652818991098e-06, + "loss": 0.9333, + "step": 82640 + }, + { + "epoch": 12.22, + "eval_loss": 0.8499127626419067, + "eval_runtime": 527.2344, + "eval_samples_per_second": 14.489, + "eval_wer": 0.3163326567368993, + "step": 82640 + }, + { + "epoch": 12.22, + "learning_rate": 3.9035608308605344e-06, + "loss": 0.9191, + "step": 82680 + }, + { + "epoch": 12.22, + "eval_loss": 0.8496977090835571, + "eval_runtime": 525.6198, + "eval_samples_per_second": 14.533, + "eval_wer": 0.3166757197175448, + "step": 82680 + }, + { + "epoch": 12.23, + "learning_rate": 3.900593471810089e-06, + "loss": 1.0383, + "step": 82720 + }, + { + "epoch": 12.23, + "eval_loss": 0.8403531312942505, + "eval_runtime": 525.391, + "eval_samples_per_second": 14.54, + "eval_wer": 0.31607535950141513, + "step": 82720 + }, + { + "epoch": 12.23, + "learning_rate": 3.897626112759644e-06, + "loss": 0.9358, + "step": 82760 + }, + { + "epoch": 12.23, + "eval_loss": 0.8650328516960144, + "eval_runtime": 525.1898, + "eval_samples_per_second": 14.545, + "eval_wer": 0.31773349724120187, + "step": 82760 + }, + { + "epoch": 12.24, + "learning_rate": 3.894658753709199e-06, + "loss": 0.9483, + "step": 82800 + }, + { + "epoch": 12.24, + "eval_loss": 0.8575060963630676, + "eval_runtime": 525.8886, + "eval_samples_per_second": 14.526, + "eval_wer": 0.31761914291432003, + "step": 82800 + }, + { + "epoch": 12.25, + "learning_rate": 3.891691394658754e-06, + "loss": 0.9819, + "step": 82840 + }, + { + "epoch": 12.25, + "eval_loss": 0.8330111503601074, + "eval_runtime": 525.3274, + "eval_samples_per_second": 14.541, + "eval_wer": 0.3162468909917379, + "step": 82840 + }, + { + "epoch": 12.25, + "learning_rate": 3.888724035608309e-06, + "loss": 0.961, + "step": 82880 + }, + { + "epoch": 12.25, + "eval_loss": 0.826102077960968, + "eval_runtime": 525.2839, + "eval_samples_per_second": 14.543, + "eval_wer": 0.3153606449584036, + "step": 82880 + }, + { + "epoch": 12.26, + "learning_rate": 3.885756676557864e-06, + "loss": 0.9158, + "step": 82920 + }, + { + "epoch": 12.26, + "eval_loss": 0.862916111946106, + "eval_runtime": 525.648, + "eval_samples_per_second": 14.533, + "eval_wer": 0.3184482117842134, + "step": 82920 + }, + { + "epoch": 12.26, + "learning_rate": 3.882789317507419e-06, + "loss": 1.0635, + "step": 82960 + }, + { + "epoch": 12.26, + "eval_loss": 0.8371991515159607, + "eval_runtime": 530.0963, + "eval_samples_per_second": 14.411, + "eval_wer": 0.3161325366648561, + "step": 82960 + }, + { + "epoch": 12.27, + "learning_rate": 3.879821958456973e-06, + "loss": 0.923, + "step": 83000 + }, + { + "epoch": 12.27, + "eval_loss": 0.8373926877975464, + "eval_runtime": 526.0901, + "eval_samples_per_second": 14.52, + "eval_wer": 0.3165327768089425, + "step": 83000 + }, + { + "epoch": 12.27, + "learning_rate": 3.876854599406529e-06, + "loss": 0.9321, + "step": 83040 + }, + { + "epoch": 12.27, + "eval_loss": 0.8375298380851746, + "eval_runtime": 526.6641, + "eval_samples_per_second": 14.505, + "eval_wer": 0.31618971382829697, + "step": 83040 + }, + { + "epoch": 12.28, + "learning_rate": 3.873887240356083e-06, + "loss": 0.9645, + "step": 83080 + }, + { + "epoch": 12.28, + "eval_loss": 0.8143869042396545, + "eval_runtime": 526.1403, + "eval_samples_per_second": 14.519, + "eval_wer": 0.3148746390691558, + "step": 83080 + }, + { + "epoch": 12.29, + "learning_rate": 3.870919881305638e-06, + "loss": 0.9869, + "step": 83120 + }, + { + "epoch": 12.29, + "eval_loss": 0.8510050773620605, + "eval_runtime": 528.1352, + "eval_samples_per_second": 14.464, + "eval_wer": 0.3173332570971154, + "step": 83120 + }, + { + "epoch": 12.29, + "learning_rate": 3.867952522255194e-06, + "loss": 0.995, + "step": 83160 + }, + { + "epoch": 12.29, + "eval_loss": 0.862872302532196, + "eval_runtime": 526.0117, + "eval_samples_per_second": 14.522, + "eval_wer": 0.3188770405100203, + "step": 83160 + }, + { + "epoch": 12.3, + "learning_rate": 3.864985163204748e-06, + "loss": 0.9564, + "step": 83200 + }, + { + "epoch": 12.3, + "eval_loss": 0.861678421497345, + "eval_runtime": 525.2189, + "eval_samples_per_second": 14.544, + "eval_wer": 0.31841962320249295, + "step": 83200 + }, + { + "epoch": 12.3, + "learning_rate": 3.8620178041543025e-06, + "loss": 0.9611, + "step": 83240 + }, + { + "epoch": 12.3, + "eval_loss": 0.8469088673591614, + "eval_runtime": 527.2918, + "eval_samples_per_second": 14.487, + "eval_wer": 0.3174762000057177, + "step": 83240 + }, + { + "epoch": 12.31, + "learning_rate": 3.859050445103858e-06, + "loss": 0.9576, + "step": 83280 + }, + { + "epoch": 12.31, + "eval_loss": 0.8363614082336426, + "eval_runtime": 525.082, + "eval_samples_per_second": 14.548, + "eval_wer": 0.3167328968809857, + "step": 83280 + }, + { + "epoch": 12.32, + "learning_rate": 3.856083086053412e-06, + "loss": 0.9516, + "step": 83320 + }, + { + "epoch": 12.32, + "eval_loss": 0.8579716086387634, + "eval_runtime": 531.1501, + "eval_samples_per_second": 14.382, + "eval_wer": 0.31830526887561106, + "step": 83320 + }, + { + "epoch": 12.32, + "learning_rate": 3.8531157270029676e-06, + "loss": 1.0121, + "step": 83360 + }, + { + "epoch": 12.32, + "eval_loss": 0.8444721698760986, + "eval_runtime": 527.8495, + "eval_samples_per_second": 14.472, + "eval_wer": 0.3175047885874382, + "step": 83360 + }, + { + "epoch": 12.33, + "learning_rate": 3.850148367952523e-06, + "loss": 1.0881, + "step": 83400 + }, + { + "epoch": 12.33, + "eval_loss": 0.8379129767417908, + "eval_runtime": 530.3179, + "eval_samples_per_second": 14.405, + "eval_wer": 0.3169901941164699, + "step": 83400 + }, + { + "epoch": 12.33, + "learning_rate": 3.847181008902077e-06, + "loss": 0.9776, + "step": 83440 + }, + { + "epoch": 12.33, + "eval_loss": 0.8223641514778137, + "eval_runtime": 529.4099, + "eval_samples_per_second": 14.429, + "eval_wer": 0.3161039480831356, + "step": 83440 + }, + { + "epoch": 12.34, + "learning_rate": 3.844213649851633e-06, + "loss": 0.97, + "step": 83480 + }, + { + "epoch": 12.34, + "eval_loss": 0.8225669264793396, + "eval_runtime": 532.1561, + "eval_samples_per_second": 14.355, + "eval_wer": 0.31627547957345836, + "step": 83480 + }, + { + "epoch": 12.35, + "learning_rate": 3.841246290801187e-06, + "loss": 1.0239, + "step": 83520 + }, + { + "epoch": 12.35, + "eval_loss": 0.8068982362747192, + "eval_runtime": 527.6683, + "eval_samples_per_second": 14.477, + "eval_wer": 0.31556076503044683, + "step": 83520 + }, + { + "epoch": 12.35, + "learning_rate": 3.838278931750742e-06, + "loss": 0.9029, + "step": 83560 + }, + { + "epoch": 12.35, + "eval_loss": 0.8129993677139282, + "eval_runtime": 526.7002, + "eval_samples_per_second": 14.504, + "eval_wer": 0.3152177020498013, + "step": 83560 + }, + { + "epoch": 12.36, + "learning_rate": 3.835311572700297e-06, + "loss": 0.9078, + "step": 83600 + }, + { + "epoch": 12.36, + "eval_loss": 0.8551590442657471, + "eval_runtime": 525.9709, + "eval_samples_per_second": 14.524, + "eval_wer": 0.31779067440464276, + "step": 83600 + }, + { + "epoch": 12.36, + "learning_rate": 3.832344213649852e-06, + "loss": 0.9009, + "step": 83640 + }, + { + "epoch": 12.36, + "eval_loss": 0.8711938261985779, + "eval_runtime": 526.0821, + "eval_samples_per_second": 14.521, + "eval_wer": 0.3192201034906658, + "step": 83640 + }, + { + "epoch": 12.37, + "learning_rate": 3.829376854599407e-06, + "loss": 0.9908, + "step": 83680 + }, + { + "epoch": 12.37, + "eval_loss": 0.8526556491851807, + "eval_runtime": 527.7971, + "eval_samples_per_second": 14.473, + "eval_wer": 0.3171903141885131, + "step": 83680 + }, + { + "epoch": 12.38, + "learning_rate": 3.826409495548962e-06, + "loss": 0.9484, + "step": 83720 + }, + { + "epoch": 12.38, + "eval_loss": 0.854936420917511, + "eval_runtime": 527.6903, + "eval_samples_per_second": 14.476, + "eval_wer": 0.3180765602218474, + "step": 83720 + }, + { + "epoch": 12.38, + "learning_rate": 3.823442136498516e-06, + "loss": 0.9649, + "step": 83760 + }, + { + "epoch": 12.38, + "eval_loss": 0.8317233324050903, + "eval_runtime": 527.8211, + "eval_samples_per_second": 14.473, + "eval_wer": 0.3167328968809857, + "step": 83760 + }, + { + "epoch": 12.39, + "learning_rate": 3.8204747774480715e-06, + "loss": 0.9479, + "step": 83800 + }, + { + "epoch": 12.39, + "eval_loss": 0.8195405006408691, + "eval_runtime": 526.4265, + "eval_samples_per_second": 14.511, + "eval_wer": 0.31607535950141513, + "step": 83800 + }, + { + "epoch": 12.39, + "learning_rate": 3.817507418397626e-06, + "loss": 0.9783, + "step": 83840 + }, + { + "epoch": 12.39, + "eval_loss": 0.8198297619819641, + "eval_runtime": 528.0249, + "eval_samples_per_second": 14.467, + "eval_wer": 0.3163326567368993, + "step": 83840 + }, + { + "epoch": 12.4, + "learning_rate": 3.8145400593471817e-06, + "loss": 0.9232, + "step": 83880 + }, + { + "epoch": 12.4, + "eval_loss": 0.840001106262207, + "eval_runtime": 526.6512, + "eval_samples_per_second": 14.505, + "eval_wer": 0.3176477314960405, + "step": 83880 + }, + { + "epoch": 12.4, + "learning_rate": 3.811572700296736e-06, + "loss": 0.9353, + "step": 83920 + }, + { + "epoch": 12.4, + "eval_loss": 0.8571428656578064, + "eval_runtime": 527.2577, + "eval_samples_per_second": 14.488, + "eval_wer": 0.31841962320249295, + "step": 83920 + }, + { + "epoch": 12.41, + "learning_rate": 3.808605341246291e-06, + "loss": 0.9092, + "step": 83960 + }, + { + "epoch": 12.41, + "eval_loss": 0.8407711386680603, + "eval_runtime": 525.1823, + "eval_samples_per_second": 14.545, + "eval_wer": 0.31736184567883585, + "step": 83960 + }, + { + "epoch": 12.42, + "learning_rate": 3.8056379821958463e-06, + "loss": 1.033, + "step": 84000 + }, + { + "epoch": 12.42, + "eval_loss": 0.8281084895133972, + "eval_runtime": 526.9442, + "eval_samples_per_second": 14.497, + "eval_wer": 0.3167614854627062, + "step": 84000 + } + ], + "max_steps": 135300, + "num_train_epochs": 20, + "total_flos": 1.856322480873076e+20, + "trial_name": null, + "trial_params": null +}