|
{ |
|
"best_metric": 0.3611119221851426, |
|
"best_model_checkpoint": "t5-small-keyword-generation-inspec\\checkpoint-20000", |
|
"epoch": 20.0, |
|
"global_step": 20000, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.5, |
|
"learning_rate": 4.93e-05, |
|
"loss": 7.9531, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 0.5, |
|
"eval_F1@10": 0.0, |
|
"eval_F1@5": 0.0, |
|
"eval_F1@M": 0.0, |
|
"eval_P@10": 0.0, |
|
"eval_P@5": 0.0, |
|
"eval_P@M": 0.0, |
|
"eval_R@10": 0.0, |
|
"eval_R@5": 0.0, |
|
"eval_R@M": 0.0, |
|
"eval_loss": 4.233538627624512, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 294.894, |
|
"eval_samples_per_second": 1.696, |
|
"eval_steps_per_second": 1.696, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"learning_rate": 9.93e-05, |
|
"loss": 3.9646, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_F1@10": 0.1977849653076471, |
|
"eval_F1@5": 0.2771428832605307, |
|
"eval_F1@M": 0.3029857823291265, |
|
"eval_P@10": 0.17059999999999995, |
|
"eval_P@5": 0.33559999999999995, |
|
"eval_P@M": 0.42588095238095236, |
|
"eval_R@10": 0.2556045288045292, |
|
"eval_R@5": 0.251349622599623, |
|
"eval_R@M": 0.2556045288045292, |
|
"eval_loss": 2.812638282775879, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 298.6756, |
|
"eval_samples_per_second": 1.674, |
|
"eval_steps_per_second": 1.674, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 1.5, |
|
"learning_rate": 9.899387755102041e-05, |
|
"loss": 2.9718, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 1.5, |
|
"eval_F1@10": 0.21689912919673357, |
|
"eval_F1@5": 0.303470865735572, |
|
"eval_F1@M": 0.3314612888315681, |
|
"eval_P@10": 0.18799999999999992, |
|
"eval_P@5": 0.3703999999999999, |
|
"eval_P@M": 0.4614, |
|
"eval_R@10": 0.2789250194250196, |
|
"eval_R@5": 0.27387566877566905, |
|
"eval_R@M": 0.2789250194250196, |
|
"eval_loss": 2.4728078842163086, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 307.3423, |
|
"eval_samples_per_second": 1.627, |
|
"eval_steps_per_second": 1.627, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"learning_rate": 9.79734693877551e-05, |
|
"loss": 2.5763, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_F1@10": 0.21342376898165072, |
|
"eval_F1@5": 0.29715987117457776, |
|
"eval_F1@M": 0.3246857584795672, |
|
"eval_P@10": 0.18480000000000008, |
|
"eval_P@5": 0.3628000000000001, |
|
"eval_P@M": 0.44907619047619074, |
|
"eval_R@10": 0.2744417082917087, |
|
"eval_R@5": 0.2677502941502946, |
|
"eval_R@M": 0.2744417082917087, |
|
"eval_loss": 2.183018445968628, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 289.0824, |
|
"eval_samples_per_second": 1.73, |
|
"eval_steps_per_second": 1.73, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 2.5, |
|
"learning_rate": 9.695510204081633e-05, |
|
"loss": 2.2131, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 2.5, |
|
"eval_F1@10": 0.22083437505943945, |
|
"eval_F1@5": 0.3085772965596502, |
|
"eval_F1@M": 0.33408261078446894, |
|
"eval_P@10": 0.1906, |
|
"eval_P@5": 0.3736000000000001, |
|
"eval_P@M": 0.45226190476190464, |
|
"eval_R@10": 0.2875526029526035, |
|
"eval_R@5": 0.28179986124986167, |
|
"eval_R@M": 0.2875526029526035, |
|
"eval_loss": 2.037614107131958, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 294.2365, |
|
"eval_samples_per_second": 1.699, |
|
"eval_steps_per_second": 1.699, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"learning_rate": 9.593469387755103e-05, |
|
"loss": 2.0094, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_F1@10": 0.23622480848222596, |
|
"eval_F1@5": 0.32680995997466633, |
|
"eval_F1@M": 0.3509576027172007, |
|
"eval_P@10": 0.2044, |
|
"eval_P@5": 0.39799999999999996, |
|
"eval_P@M": 0.4652142857142857, |
|
"eval_R@10": 0.30521768231768254, |
|
"eval_R@5": 0.29608175158175193, |
|
"eval_R@M": 0.30521768231768254, |
|
"eval_loss": 1.9597641229629517, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 299.8378, |
|
"eval_samples_per_second": 1.668, |
|
"eval_steps_per_second": 1.668, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 3.5, |
|
"learning_rate": 9.491428571428572e-05, |
|
"loss": 1.7087, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 3.5, |
|
"eval_F1@10": 0.23585947180128827, |
|
"eval_F1@5": 0.32583185474656123, |
|
"eval_F1@M": 0.3484568159051137, |
|
"eval_P@10": 0.20420000000000005, |
|
"eval_P@5": 0.39679999999999993, |
|
"eval_P@M": 0.457257142857143, |
|
"eval_R@10": 0.3021705960705962, |
|
"eval_R@5": 0.2934577533577537, |
|
"eval_R@M": 0.3021705960705962, |
|
"eval_loss": 1.9531850814819336, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 291.44, |
|
"eval_samples_per_second": 1.716, |
|
"eval_steps_per_second": 1.716, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"learning_rate": 9.389387755102042e-05, |
|
"loss": 1.7346, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_F1@10": 0.23949844293171174, |
|
"eval_F1@5": 0.3324181589652182, |
|
"eval_F1@M": 0.3555839600200287, |
|
"eval_P@10": 0.20739999999999992, |
|
"eval_P@5": 0.40439999999999987, |
|
"eval_P@M": 0.46959285714285726, |
|
"eval_R@10": 0.307689471639472, |
|
"eval_R@5": 0.30029141969142004, |
|
"eval_R@M": 0.307689471639472, |
|
"eval_loss": 1.8844341039657593, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 279.8232, |
|
"eval_samples_per_second": 1.787, |
|
"eval_steps_per_second": 1.787, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 4.5, |
|
"learning_rate": 9.287551020408164e-05, |
|
"loss": 1.4093, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 4.5, |
|
"eval_F1@10": 0.23374703381451323, |
|
"eval_F1@5": 0.3258455720749842, |
|
"eval_F1@M": 0.34501260196631756, |
|
"eval_P@10": 0.2024, |
|
"eval_P@5": 0.3964, |
|
"eval_P@M": 0.4511738095238098, |
|
"eval_R@10": 0.29999401709401724, |
|
"eval_R@5": 0.2942325452325456, |
|
"eval_R@M": 0.29999401709401724, |
|
"eval_loss": 1.8626010417938232, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 281.3111, |
|
"eval_samples_per_second": 1.777, |
|
"eval_steps_per_second": 1.777, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"learning_rate": 9.185510204081633e-05, |
|
"loss": 1.5068, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_F1@10": 0.24335615627100407, |
|
"eval_F1@5": 0.3396655599302659, |
|
"eval_F1@M": 0.3602646628912888, |
|
"eval_P@10": 0.21099999999999977, |
|
"eval_P@5": 0.4139999999999996, |
|
"eval_P@M": 0.4727857142857141, |
|
"eval_R@10": 0.3119000777000777, |
|
"eval_R@5": 0.30657915417915416, |
|
"eval_R@M": 0.3119000777000777, |
|
"eval_loss": 1.7979589700698853, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 280.6796, |
|
"eval_samples_per_second": 1.781, |
|
"eval_steps_per_second": 1.781, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 5.5, |
|
"learning_rate": 9.083469387755103e-05, |
|
"loss": 1.3146, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 5.5, |
|
"eval_F1@10": 0.24001641670200757, |
|
"eval_F1@5": 0.334409038673745, |
|
"eval_F1@M": 0.3550115948035458, |
|
"eval_P@10": 0.20839999999999997, |
|
"eval_P@5": 0.40799999999999986, |
|
"eval_P@M": 0.46737857142857153, |
|
"eval_R@10": 0.30688550338550347, |
|
"eval_R@5": 0.30161761016761024, |
|
"eval_R@M": 0.30688550338550347, |
|
"eval_loss": 1.8715476989746094, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 280.9732, |
|
"eval_samples_per_second": 1.78, |
|
"eval_steps_per_second": 1.78, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"learning_rate": 8.981428571428572e-05, |
|
"loss": 1.2704, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_F1@10": 0.24096180425219377, |
|
"eval_F1@5": 0.334974600889307, |
|
"eval_F1@M": 0.35426202280691466, |
|
"eval_P@10": 0.20859999999999995, |
|
"eval_P@5": 0.4076, |
|
"eval_P@M": 0.4599071428571428, |
|
"eval_R@10": 0.30986234321234324, |
|
"eval_R@5": 0.30275404595404604, |
|
"eval_R@M": 0.30986234321234324, |
|
"eval_loss": 1.8688002824783325, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 279.0562, |
|
"eval_samples_per_second": 1.792, |
|
"eval_steps_per_second": 1.792, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 6.5, |
|
"learning_rate": 8.879591836734694e-05, |
|
"loss": 1.1731, |
|
"step": 6500 |
|
}, |
|
{ |
|
"epoch": 6.5, |
|
"eval_F1@10": 0.2441899110215107, |
|
"eval_F1@5": 0.3420338693985756, |
|
"eval_F1@M": 0.36420169024302196, |
|
"eval_P@10": 0.2115999999999999, |
|
"eval_P@5": 0.41599999999999987, |
|
"eval_P@M": 0.4780619047619047, |
|
"eval_R@10": 0.31397009102009105, |
|
"eval_R@5": 0.3098475080475081, |
|
"eval_R@M": 0.31397009102009105, |
|
"eval_loss": 1.8536425828933716, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 291.8339, |
|
"eval_samples_per_second": 1.713, |
|
"eval_steps_per_second": 1.713, |
|
"step": 6500 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"learning_rate": 8.777551020408164e-05, |
|
"loss": 1.1174, |
|
"step": 7000 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_F1@10": 0.24262947404967916, |
|
"eval_F1@5": 0.33894085685556324, |
|
"eval_F1@M": 0.35926122996370713, |
|
"eval_P@10": 0.21039999999999992, |
|
"eval_P@5": 0.4128, |
|
"eval_P@M": 0.46843333333333326, |
|
"eval_R@10": 0.31144045954045946, |
|
"eval_R@5": 0.30653605838605835, |
|
"eval_R@M": 0.31144045954045946, |
|
"eval_loss": 1.8547453880310059, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 293.7424, |
|
"eval_samples_per_second": 1.702, |
|
"eval_steps_per_second": 1.702, |
|
"step": 7000 |
|
}, |
|
{ |
|
"epoch": 7.5, |
|
"learning_rate": 8.675510204081633e-05, |
|
"loss": 1.0319, |
|
"step": 7500 |
|
}, |
|
{ |
|
"epoch": 7.5, |
|
"eval_F1@10": 0.24435341427092733, |
|
"eval_F1@5": 0.34094378497319694, |
|
"eval_F1@M": 0.36301657635450263, |
|
"eval_P@10": 0.21159999999999995, |
|
"eval_P@5": 0.4139999999999999, |
|
"eval_P@M": 0.4739333333333334, |
|
"eval_R@10": 0.31494397269397284, |
|
"eval_R@5": 0.30938704628704644, |
|
"eval_R@M": 0.31494397269397284, |
|
"eval_loss": 1.8866732120513916, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 298.9317, |
|
"eval_samples_per_second": 1.673, |
|
"eval_steps_per_second": 1.673, |
|
"step": 7500 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"learning_rate": 8.573469387755101e-05, |
|
"loss": 1.0172, |
|
"step": 8000 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_F1@10": 0.2461478679992482, |
|
"eval_F1@5": 0.34169924781101274, |
|
"eval_F1@M": 0.36424212479986534, |
|
"eval_P@10": 0.21280000000000002, |
|
"eval_P@5": 0.41439999999999994, |
|
"eval_P@M": 0.47244523809523775, |
|
"eval_R@10": 0.3185173215673219, |
|
"eval_R@5": 0.3108509435009436, |
|
"eval_R@M": 0.3185173215673219, |
|
"eval_loss": 1.9575016498565674, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 264.7319, |
|
"eval_samples_per_second": 1.889, |
|
"eval_steps_per_second": 1.889, |
|
"step": 8000 |
|
}, |
|
{ |
|
"epoch": 8.5, |
|
"learning_rate": 8.471632653061225e-05, |
|
"loss": 0.9324, |
|
"step": 8500 |
|
}, |
|
{ |
|
"epoch": 8.5, |
|
"eval_F1@10": 0.23868666530445426, |
|
"eval_F1@5": 0.3324125028566208, |
|
"eval_F1@M": 0.3539066449202676, |
|
"eval_P@10": 0.20719999999999994, |
|
"eval_P@5": 0.4051999999999999, |
|
"eval_P@M": 0.46190476190476165, |
|
"eval_R@10": 0.3066111166611168, |
|
"eval_R@5": 0.3009154456654457, |
|
"eval_R@M": 0.3066111166611168, |
|
"eval_loss": 1.9488437175750732, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 286.0434, |
|
"eval_samples_per_second": 1.748, |
|
"eval_steps_per_second": 1.748, |
|
"step": 8500 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"learning_rate": 8.369591836734695e-05, |
|
"loss": 0.9587, |
|
"step": 9000 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_F1@10": 0.23996280126000177, |
|
"eval_F1@5": 0.33370613928555143, |
|
"eval_F1@M": 0.3559531203402726, |
|
"eval_P@10": 0.20799999999999982, |
|
"eval_P@5": 0.4059999999999997, |
|
"eval_P@M": 0.4660785714285711, |
|
"eval_R@10": 0.30781457986458, |
|
"eval_R@5": 0.30168088578088587, |
|
"eval_R@M": 0.30781457986458, |
|
"eval_loss": 1.9363871812820435, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 282.9341, |
|
"eval_samples_per_second": 1.767, |
|
"eval_steps_per_second": 1.767, |
|
"step": 9000 |
|
}, |
|
{ |
|
"epoch": 9.5, |
|
"learning_rate": 8.267551020408164e-05, |
|
"loss": 0.8864, |
|
"step": 9500 |
|
}, |
|
{ |
|
"epoch": 9.5, |
|
"eval_F1@10": 0.24553398899899156, |
|
"eval_F1@5": 0.33974727821198425, |
|
"eval_F1@M": 0.36148470868656674, |
|
"eval_P@10": 0.21259999999999998, |
|
"eval_P@5": 0.4128, |
|
"eval_P@M": 0.46541666666666653, |
|
"eval_R@10": 0.3148071484071486, |
|
"eval_R@5": 0.3069217227217229, |
|
"eval_R@M": 0.3148071484071486, |
|
"eval_loss": 2.0047595500946045, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 283.5357, |
|
"eval_samples_per_second": 1.763, |
|
"eval_steps_per_second": 1.763, |
|
"step": 9500 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"learning_rate": 8.165510204081634e-05, |
|
"loss": 0.8219, |
|
"step": 10000 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_F1@10": 0.24542163861026467, |
|
"eval_F1@5": 0.3405659428806491, |
|
"eval_F1@M": 0.36243521048954536, |
|
"eval_P@10": 0.2128, |
|
"eval_P@5": 0.4147999999999997, |
|
"eval_P@M": 0.471490476190476, |
|
"eval_R@10": 0.31549298479298493, |
|
"eval_R@5": 0.30797812187812196, |
|
"eval_R@M": 0.31549298479298493, |
|
"eval_loss": 2.050034999847412, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 284.698, |
|
"eval_samples_per_second": 1.756, |
|
"eval_steps_per_second": 1.756, |
|
"step": 10000 |
|
}, |
|
{ |
|
"epoch": 10.5, |
|
"learning_rate": 8.063469387755103e-05, |
|
"loss": 0.7906, |
|
"step": 10500 |
|
}, |
|
{ |
|
"epoch": 10.5, |
|
"eval_F1@10": 0.24112739408629902, |
|
"eval_F1@5": 0.3361905365875957, |
|
"eval_F1@M": 0.35434909789213215, |
|
"eval_P@10": 0.20859999999999984, |
|
"eval_P@5": 0.4083999999999998, |
|
"eval_P@M": 0.4588999999999998, |
|
"eval_R@10": 0.3117027250527253, |
|
"eval_R@5": 0.3052405316905319, |
|
"eval_R@M": 0.3117027250527253, |
|
"eval_loss": 2.076453685760498, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 283.1972, |
|
"eval_samples_per_second": 1.766, |
|
"eval_steps_per_second": 1.766, |
|
"step": 10500 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"learning_rate": 7.961632653061225e-05, |
|
"loss": 0.7828, |
|
"step": 11000 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_F1@10": 0.2434173157573352, |
|
"eval_F1@5": 0.3369145302410012, |
|
"eval_F1@M": 0.35818623186239346, |
|
"eval_P@10": 0.21079999999999996, |
|
"eval_P@5": 0.40959999999999974, |
|
"eval_P@M": 0.4597690476190474, |
|
"eval_R@10": 0.3140421911421914, |
|
"eval_R@5": 0.3053971694971696, |
|
"eval_R@M": 0.3140421911421914, |
|
"eval_loss": 2.0442428588867188, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 283.6328, |
|
"eval_samples_per_second": 1.763, |
|
"eval_steps_per_second": 1.763, |
|
"step": 11000 |
|
}, |
|
{ |
|
"epoch": 11.5, |
|
"learning_rate": 7.859795918367348e-05, |
|
"loss": 0.7724, |
|
"step": 11500 |
|
}, |
|
{ |
|
"epoch": 11.5, |
|
"eval_F1@10": 0.24332780944321591, |
|
"eval_F1@5": 0.3358317365640898, |
|
"eval_F1@M": 0.3594637432399048, |
|
"eval_P@10": 0.21079999999999996, |
|
"eval_P@5": 0.40799999999999986, |
|
"eval_P@M": 0.4666904761904761, |
|
"eval_R@10": 0.31255604395604414, |
|
"eval_R@5": 0.3039292041292042, |
|
"eval_R@M": 0.31255604395604414, |
|
"eval_loss": 2.1262500286102295, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 283.3582, |
|
"eval_samples_per_second": 1.765, |
|
"eval_steps_per_second": 1.765, |
|
"step": 11500 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"learning_rate": 7.757755102040817e-05, |
|
"loss": 0.6985, |
|
"step": 12000 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_F1@10": 0.24282010444872945, |
|
"eval_F1@5": 0.33782710328886834, |
|
"eval_F1@M": 0.35967159486540345, |
|
"eval_P@10": 0.2104, |
|
"eval_P@5": 0.4112, |
|
"eval_P@M": 0.4646380952380953, |
|
"eval_R@10": 0.31213939948939956, |
|
"eval_R@5": 0.30527879342879344, |
|
"eval_R@M": 0.31213939948939956, |
|
"eval_loss": 2.0867960453033447, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 281.5635, |
|
"eval_samples_per_second": 1.776, |
|
"eval_steps_per_second": 1.776, |
|
"step": 12000 |
|
}, |
|
{ |
|
"epoch": 12.5, |
|
"learning_rate": 7.655714285714286e-05, |
|
"loss": 0.6647, |
|
"step": 12500 |
|
}, |
|
{ |
|
"epoch": 12.5, |
|
"eval_F1@10": 0.24765508121946467, |
|
"eval_F1@5": 0.3433662775133368, |
|
"eval_F1@M": 0.3637068867664847, |
|
"eval_P@10": 0.21459999999999982, |
|
"eval_P@5": 0.4179999999999996, |
|
"eval_P@M": 0.4680285714285711, |
|
"eval_R@10": 0.3187178987678989, |
|
"eval_R@5": 0.3105277833277834, |
|
"eval_R@M": 0.3187178987678989, |
|
"eval_loss": 2.156297445297241, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 281.7625, |
|
"eval_samples_per_second": 1.775, |
|
"eval_steps_per_second": 1.775, |
|
"step": 12500 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"learning_rate": 7.553673469387756e-05, |
|
"loss": 0.6823, |
|
"step": 13000 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_F1@10": 0.25070757222690915, |
|
"eval_F1@5": 0.34642384380325597, |
|
"eval_F1@M": 0.36789754023066784, |
|
"eval_P@10": 0.21759999999999993, |
|
"eval_P@5": 0.4223999999999997, |
|
"eval_P@M": 0.47199523809523813, |
|
"eval_R@10": 0.3204831224331225, |
|
"eval_R@5": 0.3122700632700633, |
|
"eval_R@M": 0.3204831224331225, |
|
"eval_loss": 2.154297113418579, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 283.3444, |
|
"eval_samples_per_second": 1.765, |
|
"eval_steps_per_second": 1.765, |
|
"step": 13000 |
|
}, |
|
{ |
|
"epoch": 13.5, |
|
"learning_rate": 7.451632653061224e-05, |
|
"loss": 0.6039, |
|
"step": 13500 |
|
}, |
|
{ |
|
"epoch": 13.5, |
|
"eval_F1@10": 0.24724974591747426, |
|
"eval_F1@5": 0.34381850469791675, |
|
"eval_F1@M": 0.36370015266810973, |
|
"eval_P@10": 0.21420000000000003, |
|
"eval_P@5": 0.4179999999999999, |
|
"eval_P@M": 0.4715571428571432, |
|
"eval_R@10": 0.31813237873237904, |
|
"eval_R@5": 0.31155258075258097, |
|
"eval_R@M": 0.31813237873237904, |
|
"eval_loss": 2.273547410964966, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 282.8458, |
|
"eval_samples_per_second": 1.768, |
|
"eval_steps_per_second": 1.768, |
|
"step": 13500 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"learning_rate": 7.349591836734695e-05, |
|
"loss": 0.6657, |
|
"step": 14000 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_F1@10": 0.24294545526488653, |
|
"eval_F1@5": 0.33743259452965385, |
|
"eval_F1@M": 0.35771661821151046, |
|
"eval_P@10": 0.21059999999999995, |
|
"eval_P@5": 0.4103999999999999, |
|
"eval_P@M": 0.4632714285714285, |
|
"eval_R@10": 0.3123259573759575, |
|
"eval_R@5": 0.3057819458319459, |
|
"eval_R@M": 0.3123259573759575, |
|
"eval_loss": 2.2293343544006348, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 284.7498, |
|
"eval_samples_per_second": 1.756, |
|
"eval_steps_per_second": 1.756, |
|
"step": 14000 |
|
}, |
|
{ |
|
"epoch": 14.5, |
|
"learning_rate": 7.247551020408163e-05, |
|
"loss": 0.5512, |
|
"step": 14500 |
|
}, |
|
{ |
|
"epoch": 14.5, |
|
"eval_F1@10": 0.24609090645971843, |
|
"eval_F1@5": 0.341195668057433, |
|
"eval_F1@M": 0.3638307651069263, |
|
"eval_P@10": 0.2134, |
|
"eval_P@5": 0.4151999999999999, |
|
"eval_P@M": 0.47303809523809526, |
|
"eval_R@10": 0.31571549561549583, |
|
"eval_R@5": 0.3083380064380067, |
|
"eval_R@M": 0.31571549561549583, |
|
"eval_loss": 2.2570900917053223, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 289.2337, |
|
"eval_samples_per_second": 1.729, |
|
"eval_steps_per_second": 1.729, |
|
"step": 14500 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"learning_rate": 7.145510204081633e-05, |
|
"loss": 0.6125, |
|
"step": 15000 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_F1@10": 0.24506923303510375, |
|
"eval_F1@5": 0.34101718379659585, |
|
"eval_F1@M": 0.36054259558810675, |
|
"eval_P@10": 0.21240000000000006, |
|
"eval_P@5": 0.41520000000000007, |
|
"eval_P@M": 0.46649523809523824, |
|
"eval_R@10": 0.3145362748362751, |
|
"eval_R@5": 0.30819146964146976, |
|
"eval_R@M": 0.3145362748362751, |
|
"eval_loss": 2.300617218017578, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 285.2317, |
|
"eval_samples_per_second": 1.753, |
|
"eval_steps_per_second": 1.753, |
|
"step": 15000 |
|
}, |
|
{ |
|
"epoch": 15.5, |
|
"learning_rate": 7.043673469387755e-05, |
|
"loss": 0.5785, |
|
"step": 15500 |
|
}, |
|
{ |
|
"epoch": 15.5, |
|
"eval_F1@10": 0.2442251260644657, |
|
"eval_F1@5": 0.33893644394820904, |
|
"eval_F1@M": 0.35870379697701743, |
|
"eval_P@10": 0.21159999999999998, |
|
"eval_P@5": 0.41240000000000004, |
|
"eval_P@M": 0.46347380952380973, |
|
"eval_R@10": 0.3134413031413033, |
|
"eval_R@5": 0.3057845210345211, |
|
"eval_R@M": 0.3134413031413033, |
|
"eval_loss": 2.338202953338623, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 289.9816, |
|
"eval_samples_per_second": 1.724, |
|
"eval_steps_per_second": 1.724, |
|
"step": 15500 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"learning_rate": 6.941632653061226e-05, |
|
"loss": 0.5428, |
|
"step": 16000 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_F1@10": 0.2432725372472316, |
|
"eval_F1@5": 0.3373570716864839, |
|
"eval_F1@M": 0.3582228556960761, |
|
"eval_P@10": 0.21059999999999998, |
|
"eval_P@5": 0.4095999999999998, |
|
"eval_P@M": 0.46375, |
|
"eval_R@10": 0.3134618159618162, |
|
"eval_R@5": 0.30584154179154194, |
|
"eval_R@M": 0.3134618159618162, |
|
"eval_loss": 2.3253493309020996, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 289.4094, |
|
"eval_samples_per_second": 1.728, |
|
"eval_steps_per_second": 1.728, |
|
"step": 16000 |
|
}, |
|
{ |
|
"epoch": 16.5, |
|
"learning_rate": 6.839591836734694e-05, |
|
"loss": 0.5194, |
|
"step": 16500 |
|
}, |
|
{ |
|
"epoch": 16.5, |
|
"eval_F1@10": 0.2355793420179682, |
|
"eval_F1@5": 0.3278029424823546, |
|
"eval_F1@M": 0.3482424748282339, |
|
"eval_P@10": 0.20440000000000003, |
|
"eval_P@5": 0.3991999999999999, |
|
"eval_P@M": 0.4537833333333335, |
|
"eval_R@10": 0.30187379287379296, |
|
"eval_R@5": 0.2962392329892331, |
|
"eval_R@M": 0.30187379287379296, |
|
"eval_loss": 2.3528101444244385, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 290.7706, |
|
"eval_samples_per_second": 1.72, |
|
"eval_steps_per_second": 1.72, |
|
"step": 16500 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"learning_rate": 6.737551020408163e-05, |
|
"loss": 0.5194, |
|
"step": 17000 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_F1@10": 0.24069023813939067, |
|
"eval_F1@5": 0.33479577971048596, |
|
"eval_F1@M": 0.355847497067776, |
|
"eval_P@10": 0.20800000000000002, |
|
"eval_P@5": 0.40559999999999996, |
|
"eval_P@M": 0.46179999999999993, |
|
"eval_R@10": 0.311403085803086, |
|
"eval_R@5": 0.3045922632922635, |
|
"eval_R@M": 0.311403085803086, |
|
"eval_loss": 2.3786723613739014, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 272.2042, |
|
"eval_samples_per_second": 1.837, |
|
"eval_steps_per_second": 1.837, |
|
"step": 17000 |
|
}, |
|
{ |
|
"epoch": 17.5, |
|
"learning_rate": 6.635510204081633e-05, |
|
"loss": 0.4734, |
|
"step": 17500 |
|
}, |
|
{ |
|
"epoch": 17.5, |
|
"eval_F1@10": 0.2424905535962076, |
|
"eval_F1@5": 0.33929873949579886, |
|
"eval_F1@M": 0.36014400369152755, |
|
"eval_P@10": 0.20979999999999996, |
|
"eval_P@5": 0.4119999999999998, |
|
"eval_P@M": 0.46821190476190494, |
|
"eval_R@10": 0.3125397380397382, |
|
"eval_R@5": 0.3077346153846155, |
|
"eval_R@M": 0.3125397380397382, |
|
"eval_loss": 2.3801848888397217, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 269.1685, |
|
"eval_samples_per_second": 1.858, |
|
"eval_steps_per_second": 1.858, |
|
"step": 17500 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"learning_rate": 6.533469387755102e-05, |
|
"loss": 0.4685, |
|
"step": 18000 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_F1@10": 0.2428809489937239, |
|
"eval_F1@5": 0.34102215725451057, |
|
"eval_F1@M": 0.36136990799018703, |
|
"eval_P@10": 0.20919999999999994, |
|
"eval_P@5": 0.41119999999999984, |
|
"eval_P@M": 0.4681333333333333, |
|
"eval_R@10": 0.31634897324897343, |
|
"eval_R@5": 0.31194796314796325, |
|
"eval_R@M": 0.31634897324897343, |
|
"eval_loss": 2.4091179370880127, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 264.9477, |
|
"eval_samples_per_second": 1.887, |
|
"eval_steps_per_second": 1.887, |
|
"step": 18000 |
|
}, |
|
{ |
|
"epoch": 18.5, |
|
"learning_rate": 6.431428571428572e-05, |
|
"loss": 0.4574, |
|
"step": 18500 |
|
}, |
|
{ |
|
"epoch": 18.5, |
|
"eval_F1@10": 0.24470615952450722, |
|
"eval_F1@5": 0.34083279204455713, |
|
"eval_F1@M": 0.3591474804177593, |
|
"eval_P@10": 0.21199999999999997, |
|
"eval_P@5": 0.41440000000000005, |
|
"eval_P@M": 0.46359047619047605, |
|
"eval_R@10": 0.31490344655344676, |
|
"eval_R@5": 0.30879514929514945, |
|
"eval_R@M": 0.31490344655344676, |
|
"eval_loss": 2.414991617202759, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 289.5904, |
|
"eval_samples_per_second": 1.727, |
|
"eval_steps_per_second": 1.727, |
|
"step": 18500 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"learning_rate": 6.329387755102041e-05, |
|
"loss": 0.4411, |
|
"step": 19000 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_F1@10": 0.2413860020074456, |
|
"eval_F1@5": 0.3365299011446076, |
|
"eval_F1@M": 0.3552537179710558, |
|
"eval_P@10": 0.20879999999999999, |
|
"eval_P@5": 0.4083999999999998, |
|
"eval_P@M": 0.4593714285714285, |
|
"eval_R@10": 0.31052307137307145, |
|
"eval_R@5": 0.3046235042735043, |
|
"eval_R@M": 0.31052307137307145, |
|
"eval_loss": 2.5369248390197754, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 281.7996, |
|
"eval_samples_per_second": 1.774, |
|
"eval_steps_per_second": 1.774, |
|
"step": 19000 |
|
}, |
|
{ |
|
"epoch": 19.5, |
|
"learning_rate": 6.22734693877551e-05, |
|
"loss": 0.4032, |
|
"step": 19500 |
|
}, |
|
{ |
|
"epoch": 19.5, |
|
"eval_F1@10": 0.2432083462438766, |
|
"eval_F1@5": 0.3403430030753566, |
|
"eval_F1@M": 0.35755804044596656, |
|
"eval_P@10": 0.2102, |
|
"eval_P@5": 0.4132000000000002, |
|
"eval_P@M": 0.4617999999999998, |
|
"eval_R@10": 0.3141284104784106, |
|
"eval_R@5": 0.30864017094017104, |
|
"eval_R@M": 0.3141284104784106, |
|
"eval_loss": 2.560804605484009, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 296.5123, |
|
"eval_samples_per_second": 1.686, |
|
"eval_steps_per_second": 1.686, |
|
"step": 19500 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"learning_rate": 6.125510204081633e-05, |
|
"loss": 0.4402, |
|
"step": 20000 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_F1@10": 0.24569117638243435, |
|
"eval_F1@5": 0.3409062858709922, |
|
"eval_F1@M": 0.3611119221851426, |
|
"eval_P@10": 0.21239999999999998, |
|
"eval_P@5": 0.41359999999999997, |
|
"eval_P@M": 0.4668095238095235, |
|
"eval_R@10": 0.3174460150960153, |
|
"eval_R@5": 0.3095908924408926, |
|
"eval_R@M": 0.3174460150960153, |
|
"eval_loss": 2.5116209983825684, |
|
"eval_model_name": "t5-small-keyword-generation-inspec", |
|
"eval_runtime": 280.4633, |
|
"eval_samples_per_second": 1.783, |
|
"eval_steps_per_second": 1.783, |
|
"step": 20000 |
|
} |
|
], |
|
"max_steps": 50000, |
|
"num_train_epochs": 50, |
|
"total_flos": 2706836029440000.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|