|
{ |
|
"best_metric": 0.026571398600935936, |
|
"best_model_checkpoint": "/home/cloudwalker/ASVmodel/facebook_wav2vec2-base/checkpoint-100", |
|
"epoch": 9.98109640831758, |
|
"eval_steps": 100, |
|
"global_step": 3960, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.25, |
|
"learning_rate": 7.575757575757576e-05, |
|
"loss": 0.352, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 0.25, |
|
"eval_accuracy": 0.9960553856061826, |
|
"eval_loss": 0.026571398600935936, |
|
"eval_runtime": 488.9037, |
|
"eval_samples_per_second": 50.816, |
|
"eval_steps_per_second": 25.408, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 0.5, |
|
"learning_rate": 0.00015151515151515152, |
|
"loss": 0.2689, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 0.5, |
|
"eval_accuracy": 0.980800193205603, |
|
"eval_loss": 0.21770231425762177, |
|
"eval_runtime": 491.786, |
|
"eval_samples_per_second": 50.518, |
|
"eval_steps_per_second": 25.259, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 0.76, |
|
"learning_rate": 0.00022727272727272725, |
|
"loss": 1.2723, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 0.76, |
|
"eval_accuracy": 0.992432780550636, |
|
"eval_loss": 0.035364724695682526, |
|
"eval_runtime": 491.4276, |
|
"eval_samples_per_second": 50.555, |
|
"eval_steps_per_second": 25.277, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 1.01, |
|
"learning_rate": 0.00029966329966329963, |
|
"loss": 0.6624, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 1.01, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.4243304133415222, |
|
"eval_runtime": 491.3199, |
|
"eval_samples_per_second": 50.566, |
|
"eval_steps_per_second": 25.283, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 1.26, |
|
"learning_rate": 0.00029124579124579125, |
|
"loss": 0.5959, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 1.26, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.4804568290710449, |
|
"eval_runtime": 491.6703, |
|
"eval_samples_per_second": 50.53, |
|
"eval_steps_per_second": 25.265, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 1.51, |
|
"learning_rate": 0.0002828282828282828, |
|
"loss": 0.594, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 1.51, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.4400762617588043, |
|
"eval_runtime": 491.6688, |
|
"eval_samples_per_second": 50.53, |
|
"eval_steps_per_second": 25.265, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 1.76, |
|
"learning_rate": 0.0002744107744107744, |
|
"loss": 0.6017, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 1.76, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.4308442175388336, |
|
"eval_runtime": 491.729, |
|
"eval_samples_per_second": 50.524, |
|
"eval_steps_per_second": 25.262, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 2.02, |
|
"learning_rate": 0.00026599326599326595, |
|
"loss": 0.5973, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 2.02, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.39036858081817627, |
|
"eval_runtime": 491.5847, |
|
"eval_samples_per_second": 50.539, |
|
"eval_steps_per_second": 25.269, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 2.27, |
|
"learning_rate": 0.00025757575757575756, |
|
"loss": 0.6096, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 2.27, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.4003813862800598, |
|
"eval_runtime": 491.46, |
|
"eval_samples_per_second": 50.551, |
|
"eval_steps_per_second": 25.276, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 2.52, |
|
"learning_rate": 0.00024915824915824913, |
|
"loss": 0.5936, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 2.52, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.41795614361763, |
|
"eval_runtime": 491.8429, |
|
"eval_samples_per_second": 50.512, |
|
"eval_steps_per_second": 25.256, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 2.77, |
|
"learning_rate": 0.00024074074074074072, |
|
"loss": 0.5932, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 2.77, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.4600105881690979, |
|
"eval_runtime": 491.5387, |
|
"eval_samples_per_second": 50.543, |
|
"eval_steps_per_second": 25.272, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 3.02, |
|
"learning_rate": 0.0002323232323232323, |
|
"loss": 0.5884, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 3.02, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.4334673285484314, |
|
"eval_runtime": 491.9313, |
|
"eval_samples_per_second": 50.503, |
|
"eval_steps_per_second": 25.251, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 3.28, |
|
"learning_rate": 0.0002239057239057239, |
|
"loss": 0.5815, |
|
"step": 1300 |
|
}, |
|
{ |
|
"epoch": 3.28, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.37108397483825684, |
|
"eval_runtime": 491.7823, |
|
"eval_samples_per_second": 50.518, |
|
"eval_steps_per_second": 25.259, |
|
"step": 1300 |
|
}, |
|
{ |
|
"epoch": 3.53, |
|
"learning_rate": 0.00021548821548821544, |
|
"loss": 0.5923, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 3.53, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.4266449213027954, |
|
"eval_runtime": 491.763, |
|
"eval_samples_per_second": 50.52, |
|
"eval_steps_per_second": 25.26, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 3.78, |
|
"learning_rate": 0.00020707070707070703, |
|
"loss": 0.6062, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 3.78, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.4494142532348633, |
|
"eval_runtime": 491.657, |
|
"eval_samples_per_second": 50.531, |
|
"eval_steps_per_second": 25.266, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 4.03, |
|
"learning_rate": 0.00019865319865319862, |
|
"loss": 0.6025, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 4.03, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.40983960032463074, |
|
"eval_runtime": 491.6314, |
|
"eval_samples_per_second": 50.534, |
|
"eval_steps_per_second": 25.267, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 4.28, |
|
"learning_rate": 0.00019023569023569022, |
|
"loss": 0.5907, |
|
"step": 1700 |
|
}, |
|
{ |
|
"epoch": 4.28, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.3796265125274658, |
|
"eval_runtime": 491.8727, |
|
"eval_samples_per_second": 50.509, |
|
"eval_steps_per_second": 25.255, |
|
"step": 1700 |
|
}, |
|
{ |
|
"epoch": 4.54, |
|
"learning_rate": 0.0001818181818181818, |
|
"loss": 0.5933, |
|
"step": 1800 |
|
}, |
|
{ |
|
"epoch": 4.54, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.41142529249191284, |
|
"eval_runtime": 491.9136, |
|
"eval_samples_per_second": 50.505, |
|
"eval_steps_per_second": 25.252, |
|
"step": 1800 |
|
}, |
|
{ |
|
"epoch": 4.79, |
|
"learning_rate": 0.0001734006734006734, |
|
"loss": 0.5997, |
|
"step": 1900 |
|
}, |
|
{ |
|
"epoch": 4.79, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.4283621311187744, |
|
"eval_runtime": 492.0918, |
|
"eval_samples_per_second": 50.487, |
|
"eval_steps_per_second": 25.243, |
|
"step": 1900 |
|
}, |
|
{ |
|
"epoch": 5.04, |
|
"learning_rate": 0.000164983164983165, |
|
"loss": 0.6028, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 5.04, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.4269249737262726, |
|
"eval_runtime": 492.0087, |
|
"eval_samples_per_second": 50.495, |
|
"eval_steps_per_second": 25.248, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 5.29, |
|
"learning_rate": 0.00015656565656565653, |
|
"loss": 0.5936, |
|
"step": 2100 |
|
}, |
|
{ |
|
"epoch": 5.29, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.4423413872718811, |
|
"eval_runtime": 492.1387, |
|
"eval_samples_per_second": 50.482, |
|
"eval_steps_per_second": 25.241, |
|
"step": 2100 |
|
}, |
|
{ |
|
"epoch": 5.55, |
|
"learning_rate": 0.00014814814814814812, |
|
"loss": 0.5994, |
|
"step": 2200 |
|
}, |
|
{ |
|
"epoch": 5.55, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.43968868255615234, |
|
"eval_runtime": 491.824, |
|
"eval_samples_per_second": 50.514, |
|
"eval_steps_per_second": 25.257, |
|
"step": 2200 |
|
}, |
|
{ |
|
"epoch": 5.8, |
|
"learning_rate": 0.0001397306397306397, |
|
"loss": 0.5937, |
|
"step": 2300 |
|
}, |
|
{ |
|
"epoch": 5.8, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.43047070503234863, |
|
"eval_runtime": 492.196, |
|
"eval_samples_per_second": 50.476, |
|
"eval_steps_per_second": 25.238, |
|
"step": 2300 |
|
}, |
|
{ |
|
"epoch": 6.05, |
|
"learning_rate": 0.0001313131313131313, |
|
"loss": 0.5958, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 6.05, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.43379682302474976, |
|
"eval_runtime": 492.4115, |
|
"eval_samples_per_second": 50.454, |
|
"eval_steps_per_second": 25.227, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 6.3, |
|
"learning_rate": 0.0001228956228956229, |
|
"loss": 0.5984, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 6.3, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.394501656293869, |
|
"eval_runtime": 491.7814, |
|
"eval_samples_per_second": 50.518, |
|
"eval_steps_per_second": 25.259, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 6.55, |
|
"learning_rate": 0.00011447811447811446, |
|
"loss": 0.5943, |
|
"step": 2600 |
|
}, |
|
{ |
|
"epoch": 6.55, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.38777557015419006, |
|
"eval_runtime": 492.0653, |
|
"eval_samples_per_second": 50.489, |
|
"eval_steps_per_second": 25.245, |
|
"step": 2600 |
|
}, |
|
{ |
|
"epoch": 6.81, |
|
"learning_rate": 0.00010606060606060605, |
|
"loss": 0.5819, |
|
"step": 2700 |
|
}, |
|
{ |
|
"epoch": 6.81, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.42347970604896545, |
|
"eval_runtime": 491.9589, |
|
"eval_samples_per_second": 50.5, |
|
"eval_steps_per_second": 25.25, |
|
"step": 2700 |
|
}, |
|
{ |
|
"epoch": 7.06, |
|
"learning_rate": 9.764309764309764e-05, |
|
"loss": 0.594, |
|
"step": 2800 |
|
}, |
|
{ |
|
"epoch": 7.06, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.4160361886024475, |
|
"eval_runtime": 491.6691, |
|
"eval_samples_per_second": 50.53, |
|
"eval_steps_per_second": 25.265, |
|
"step": 2800 |
|
}, |
|
{ |
|
"epoch": 7.31, |
|
"learning_rate": 8.92255892255892e-05, |
|
"loss": 0.5883, |
|
"step": 2900 |
|
}, |
|
{ |
|
"epoch": 7.31, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.4075636565685272, |
|
"eval_runtime": 492.0942, |
|
"eval_samples_per_second": 50.486, |
|
"eval_steps_per_second": 25.243, |
|
"step": 2900 |
|
}, |
|
{ |
|
"epoch": 7.56, |
|
"learning_rate": 8.08080808080808e-05, |
|
"loss": 0.5877, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 7.56, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.4212785065174103, |
|
"eval_runtime": 491.8, |
|
"eval_samples_per_second": 50.516, |
|
"eval_steps_per_second": 25.258, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 7.81, |
|
"learning_rate": 7.239057239057239e-05, |
|
"loss": 0.5939, |
|
"step": 3100 |
|
}, |
|
{ |
|
"epoch": 7.81, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.4088614583015442, |
|
"eval_runtime": 492.134, |
|
"eval_samples_per_second": 50.482, |
|
"eval_steps_per_second": 25.241, |
|
"step": 3100 |
|
}, |
|
{ |
|
"epoch": 8.07, |
|
"learning_rate": 6.397306397306397e-05, |
|
"loss": 0.6025, |
|
"step": 3200 |
|
}, |
|
{ |
|
"epoch": 8.07, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.4384858310222626, |
|
"eval_runtime": 491.7955, |
|
"eval_samples_per_second": 50.517, |
|
"eval_steps_per_second": 25.258, |
|
"step": 3200 |
|
}, |
|
{ |
|
"epoch": 8.32, |
|
"learning_rate": 5.5555555555555545e-05, |
|
"loss": 0.6016, |
|
"step": 3300 |
|
}, |
|
{ |
|
"epoch": 8.32, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.4373140335083008, |
|
"eval_runtime": 491.7882, |
|
"eval_samples_per_second": 50.518, |
|
"eval_steps_per_second": 25.259, |
|
"step": 3300 |
|
}, |
|
{ |
|
"epoch": 8.57, |
|
"learning_rate": 4.7138047138047136e-05, |
|
"loss": 0.5815, |
|
"step": 3400 |
|
}, |
|
{ |
|
"epoch": 8.57, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.4190850555896759, |
|
"eval_runtime": 492.4127, |
|
"eval_samples_per_second": 50.454, |
|
"eval_steps_per_second": 25.227, |
|
"step": 3400 |
|
}, |
|
{ |
|
"epoch": 8.82, |
|
"learning_rate": 3.8720538720538714e-05, |
|
"loss": 0.5915, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 8.82, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.4215960204601288, |
|
"eval_runtime": 491.8471, |
|
"eval_samples_per_second": 50.512, |
|
"eval_steps_per_second": 25.256, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 9.07, |
|
"learning_rate": 3.03030303030303e-05, |
|
"loss": 0.602, |
|
"step": 3600 |
|
}, |
|
{ |
|
"epoch": 9.07, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.4336757957935333, |
|
"eval_runtime": 491.8986, |
|
"eval_samples_per_second": 50.506, |
|
"eval_steps_per_second": 25.253, |
|
"step": 3600 |
|
}, |
|
{ |
|
"epoch": 9.33, |
|
"learning_rate": 2.1885521885521884e-05, |
|
"loss": 0.5907, |
|
"step": 3700 |
|
}, |
|
{ |
|
"epoch": 9.33, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.4128669798374176, |
|
"eval_runtime": 491.7648, |
|
"eval_samples_per_second": 50.52, |
|
"eval_steps_per_second": 25.26, |
|
"step": 3700 |
|
}, |
|
{ |
|
"epoch": 9.58, |
|
"learning_rate": 1.3468013468013465e-05, |
|
"loss": 0.603, |
|
"step": 3800 |
|
}, |
|
{ |
|
"epoch": 9.58, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.4216155707836151, |
|
"eval_runtime": 491.5621, |
|
"eval_samples_per_second": 50.541, |
|
"eval_steps_per_second": 25.27, |
|
"step": 3800 |
|
}, |
|
{ |
|
"epoch": 9.83, |
|
"learning_rate": 5.05050505050505e-06, |
|
"loss": 0.593, |
|
"step": 3900 |
|
}, |
|
{ |
|
"epoch": 9.83, |
|
"eval_accuracy": 0.8974400257607471, |
|
"eval_loss": 0.42267537117004395, |
|
"eval_runtime": 491.786, |
|
"eval_samples_per_second": 50.518, |
|
"eval_steps_per_second": 25.259, |
|
"step": 3900 |
|
}, |
|
{ |
|
"epoch": 9.98, |
|
"step": 3960, |
|
"total_flos": 1.5053705916862923e+19, |
|
"train_loss": 0.5994764679610127, |
|
"train_runtime": 37020.076, |
|
"train_samples_per_second": 6.856, |
|
"train_steps_per_second": 0.107 |
|
} |
|
], |
|
"logging_steps": 100, |
|
"max_steps": 3960, |
|
"num_train_epochs": 10, |
|
"save_steps": 100, |
|
"total_flos": 1.5053705916862923e+19, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|