{ "best_metric": 0.026571398600935936, "best_model_checkpoint": "/home/cloudwalker/ASVmodel/facebook_wav2vec2-base/checkpoint-100", "epoch": 9.98109640831758, "eval_steps": 100, "global_step": 3960, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.25, "learning_rate": 7.575757575757576e-05, "loss": 0.352, "step": 100 }, { "epoch": 0.25, "eval_accuracy": 0.9960553856061826, "eval_loss": 0.026571398600935936, "eval_runtime": 488.9037, "eval_samples_per_second": 50.816, "eval_steps_per_second": 25.408, "step": 100 }, { "epoch": 0.5, "learning_rate": 0.00015151515151515152, "loss": 0.2689, "step": 200 }, { "epoch": 0.5, "eval_accuracy": 0.980800193205603, "eval_loss": 0.21770231425762177, "eval_runtime": 491.786, "eval_samples_per_second": 50.518, "eval_steps_per_second": 25.259, "step": 200 }, { "epoch": 0.76, "learning_rate": 0.00022727272727272725, "loss": 1.2723, "step": 300 }, { "epoch": 0.76, "eval_accuracy": 0.992432780550636, "eval_loss": 0.035364724695682526, "eval_runtime": 491.4276, "eval_samples_per_second": 50.555, "eval_steps_per_second": 25.277, "step": 300 }, { "epoch": 1.01, "learning_rate": 0.00029966329966329963, "loss": 0.6624, "step": 400 }, { "epoch": 1.01, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.4243304133415222, "eval_runtime": 491.3199, "eval_samples_per_second": 50.566, "eval_steps_per_second": 25.283, "step": 400 }, { "epoch": 1.26, "learning_rate": 0.00029124579124579125, "loss": 0.5959, "step": 500 }, { "epoch": 1.26, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.4804568290710449, "eval_runtime": 491.6703, "eval_samples_per_second": 50.53, "eval_steps_per_second": 25.265, "step": 500 }, { "epoch": 1.51, "learning_rate": 0.0002828282828282828, "loss": 0.594, "step": 600 }, { "epoch": 1.51, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.4400762617588043, "eval_runtime": 491.6688, "eval_samples_per_second": 50.53, "eval_steps_per_second": 25.265, "step": 600 }, { "epoch": 1.76, "learning_rate": 0.0002744107744107744, "loss": 0.6017, "step": 700 }, { "epoch": 1.76, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.4308442175388336, "eval_runtime": 491.729, "eval_samples_per_second": 50.524, "eval_steps_per_second": 25.262, "step": 700 }, { "epoch": 2.02, "learning_rate": 0.00026599326599326595, "loss": 0.5973, "step": 800 }, { "epoch": 2.02, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.39036858081817627, "eval_runtime": 491.5847, "eval_samples_per_second": 50.539, "eval_steps_per_second": 25.269, "step": 800 }, { "epoch": 2.27, "learning_rate": 0.00025757575757575756, "loss": 0.6096, "step": 900 }, { "epoch": 2.27, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.4003813862800598, "eval_runtime": 491.46, "eval_samples_per_second": 50.551, "eval_steps_per_second": 25.276, "step": 900 }, { "epoch": 2.52, "learning_rate": 0.00024915824915824913, "loss": 0.5936, "step": 1000 }, { "epoch": 2.52, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.41795614361763, "eval_runtime": 491.8429, "eval_samples_per_second": 50.512, "eval_steps_per_second": 25.256, "step": 1000 }, { "epoch": 2.77, "learning_rate": 0.00024074074074074072, "loss": 0.5932, "step": 1100 }, { "epoch": 2.77, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.4600105881690979, "eval_runtime": 491.5387, "eval_samples_per_second": 50.543, "eval_steps_per_second": 25.272, "step": 1100 }, { "epoch": 3.02, "learning_rate": 0.0002323232323232323, "loss": 0.5884, "step": 1200 }, { "epoch": 3.02, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.4334673285484314, "eval_runtime": 491.9313, "eval_samples_per_second": 50.503, "eval_steps_per_second": 25.251, "step": 1200 }, { "epoch": 3.28, "learning_rate": 0.0002239057239057239, "loss": 0.5815, "step": 1300 }, { "epoch": 3.28, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.37108397483825684, "eval_runtime": 491.7823, "eval_samples_per_second": 50.518, "eval_steps_per_second": 25.259, "step": 1300 }, { "epoch": 3.53, "learning_rate": 0.00021548821548821544, "loss": 0.5923, "step": 1400 }, { "epoch": 3.53, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.4266449213027954, "eval_runtime": 491.763, "eval_samples_per_second": 50.52, "eval_steps_per_second": 25.26, "step": 1400 }, { "epoch": 3.78, "learning_rate": 0.00020707070707070703, "loss": 0.6062, "step": 1500 }, { "epoch": 3.78, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.4494142532348633, "eval_runtime": 491.657, "eval_samples_per_second": 50.531, "eval_steps_per_second": 25.266, "step": 1500 }, { "epoch": 4.03, "learning_rate": 0.00019865319865319862, "loss": 0.6025, "step": 1600 }, { "epoch": 4.03, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.40983960032463074, "eval_runtime": 491.6314, "eval_samples_per_second": 50.534, "eval_steps_per_second": 25.267, "step": 1600 }, { "epoch": 4.28, "learning_rate": 0.00019023569023569022, "loss": 0.5907, "step": 1700 }, { "epoch": 4.28, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.3796265125274658, "eval_runtime": 491.8727, "eval_samples_per_second": 50.509, "eval_steps_per_second": 25.255, "step": 1700 }, { "epoch": 4.54, "learning_rate": 0.0001818181818181818, "loss": 0.5933, "step": 1800 }, { "epoch": 4.54, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.41142529249191284, "eval_runtime": 491.9136, "eval_samples_per_second": 50.505, "eval_steps_per_second": 25.252, "step": 1800 }, { "epoch": 4.79, "learning_rate": 0.0001734006734006734, "loss": 0.5997, "step": 1900 }, { "epoch": 4.79, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.4283621311187744, "eval_runtime": 492.0918, "eval_samples_per_second": 50.487, "eval_steps_per_second": 25.243, "step": 1900 }, { "epoch": 5.04, "learning_rate": 0.000164983164983165, "loss": 0.6028, "step": 2000 }, { "epoch": 5.04, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.4269249737262726, "eval_runtime": 492.0087, "eval_samples_per_second": 50.495, "eval_steps_per_second": 25.248, "step": 2000 }, { "epoch": 5.29, "learning_rate": 0.00015656565656565653, "loss": 0.5936, "step": 2100 }, { "epoch": 5.29, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.4423413872718811, "eval_runtime": 492.1387, "eval_samples_per_second": 50.482, "eval_steps_per_second": 25.241, "step": 2100 }, { "epoch": 5.55, "learning_rate": 0.00014814814814814812, "loss": 0.5994, "step": 2200 }, { "epoch": 5.55, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.43968868255615234, "eval_runtime": 491.824, "eval_samples_per_second": 50.514, "eval_steps_per_second": 25.257, "step": 2200 }, { "epoch": 5.8, "learning_rate": 0.0001397306397306397, "loss": 0.5937, "step": 2300 }, { "epoch": 5.8, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.43047070503234863, "eval_runtime": 492.196, "eval_samples_per_second": 50.476, "eval_steps_per_second": 25.238, "step": 2300 }, { "epoch": 6.05, "learning_rate": 0.0001313131313131313, "loss": 0.5958, "step": 2400 }, { "epoch": 6.05, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.43379682302474976, "eval_runtime": 492.4115, "eval_samples_per_second": 50.454, "eval_steps_per_second": 25.227, "step": 2400 }, { "epoch": 6.3, "learning_rate": 0.0001228956228956229, "loss": 0.5984, "step": 2500 }, { "epoch": 6.3, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.394501656293869, "eval_runtime": 491.7814, "eval_samples_per_second": 50.518, "eval_steps_per_second": 25.259, "step": 2500 }, { "epoch": 6.55, "learning_rate": 0.00011447811447811446, "loss": 0.5943, "step": 2600 }, { "epoch": 6.55, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.38777557015419006, "eval_runtime": 492.0653, "eval_samples_per_second": 50.489, "eval_steps_per_second": 25.245, "step": 2600 }, { "epoch": 6.81, "learning_rate": 0.00010606060606060605, "loss": 0.5819, "step": 2700 }, { "epoch": 6.81, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.42347970604896545, "eval_runtime": 491.9589, "eval_samples_per_second": 50.5, "eval_steps_per_second": 25.25, "step": 2700 }, { "epoch": 7.06, "learning_rate": 9.764309764309764e-05, "loss": 0.594, "step": 2800 }, { "epoch": 7.06, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.4160361886024475, "eval_runtime": 491.6691, "eval_samples_per_second": 50.53, "eval_steps_per_second": 25.265, "step": 2800 }, { "epoch": 7.31, "learning_rate": 8.92255892255892e-05, "loss": 0.5883, "step": 2900 }, { "epoch": 7.31, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.4075636565685272, "eval_runtime": 492.0942, "eval_samples_per_second": 50.486, "eval_steps_per_second": 25.243, "step": 2900 }, { "epoch": 7.56, "learning_rate": 8.08080808080808e-05, "loss": 0.5877, "step": 3000 }, { "epoch": 7.56, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.4212785065174103, "eval_runtime": 491.8, "eval_samples_per_second": 50.516, "eval_steps_per_second": 25.258, "step": 3000 }, { "epoch": 7.81, "learning_rate": 7.239057239057239e-05, "loss": 0.5939, "step": 3100 }, { "epoch": 7.81, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.4088614583015442, "eval_runtime": 492.134, "eval_samples_per_second": 50.482, "eval_steps_per_second": 25.241, "step": 3100 }, { "epoch": 8.07, "learning_rate": 6.397306397306397e-05, "loss": 0.6025, "step": 3200 }, { "epoch": 8.07, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.4384858310222626, "eval_runtime": 491.7955, "eval_samples_per_second": 50.517, "eval_steps_per_second": 25.258, "step": 3200 }, { "epoch": 8.32, "learning_rate": 5.5555555555555545e-05, "loss": 0.6016, "step": 3300 }, { "epoch": 8.32, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.4373140335083008, "eval_runtime": 491.7882, "eval_samples_per_second": 50.518, "eval_steps_per_second": 25.259, "step": 3300 }, { "epoch": 8.57, "learning_rate": 4.7138047138047136e-05, "loss": 0.5815, "step": 3400 }, { "epoch": 8.57, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.4190850555896759, "eval_runtime": 492.4127, "eval_samples_per_second": 50.454, "eval_steps_per_second": 25.227, "step": 3400 }, { "epoch": 8.82, "learning_rate": 3.8720538720538714e-05, "loss": 0.5915, "step": 3500 }, { "epoch": 8.82, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.4215960204601288, "eval_runtime": 491.8471, "eval_samples_per_second": 50.512, "eval_steps_per_second": 25.256, "step": 3500 }, { "epoch": 9.07, "learning_rate": 3.03030303030303e-05, "loss": 0.602, "step": 3600 }, { "epoch": 9.07, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.4336757957935333, "eval_runtime": 491.8986, "eval_samples_per_second": 50.506, "eval_steps_per_second": 25.253, "step": 3600 }, { "epoch": 9.33, "learning_rate": 2.1885521885521884e-05, "loss": 0.5907, "step": 3700 }, { "epoch": 9.33, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.4128669798374176, "eval_runtime": 491.7648, "eval_samples_per_second": 50.52, "eval_steps_per_second": 25.26, "step": 3700 }, { "epoch": 9.58, "learning_rate": 1.3468013468013465e-05, "loss": 0.603, "step": 3800 }, { "epoch": 9.58, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.4216155707836151, "eval_runtime": 491.5621, "eval_samples_per_second": 50.541, "eval_steps_per_second": 25.27, "step": 3800 }, { "epoch": 9.83, "learning_rate": 5.05050505050505e-06, "loss": 0.593, "step": 3900 }, { "epoch": 9.83, "eval_accuracy": 0.8974400257607471, "eval_loss": 0.42267537117004395, "eval_runtime": 491.786, "eval_samples_per_second": 50.518, "eval_steps_per_second": 25.259, "step": 3900 }, { "epoch": 9.98, "step": 3960, "total_flos": 1.5053705916862923e+19, "train_loss": 0.5994764679610127, "train_runtime": 37020.076, "train_samples_per_second": 6.856, "train_steps_per_second": 0.107 } ], "logging_steps": 100, "max_steps": 3960, "num_train_epochs": 10, "save_steps": 100, "total_flos": 1.5053705916862923e+19, "trial_name": null, "trial_params": null }