Thomas De Decker
Add model
2b941d3
raw
history blame
29.6 kB
{
"best_metric": 0.3611119221851426,
"best_model_checkpoint": "t5-small-keyword-generation-inspec\\checkpoint-20000",
"epoch": 20.0,
"global_step": 20000,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.5,
"learning_rate": 4.93e-05,
"loss": 7.9531,
"step": 500
},
{
"epoch": 0.5,
"eval_F1@10": 0.0,
"eval_F1@5": 0.0,
"eval_F1@M": 0.0,
"eval_P@10": 0.0,
"eval_P@5": 0.0,
"eval_P@M": 0.0,
"eval_R@10": 0.0,
"eval_R@5": 0.0,
"eval_R@M": 0.0,
"eval_loss": 4.233538627624512,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 294.894,
"eval_samples_per_second": 1.696,
"eval_steps_per_second": 1.696,
"step": 500
},
{
"epoch": 1.0,
"learning_rate": 9.93e-05,
"loss": 3.9646,
"step": 1000
},
{
"epoch": 1.0,
"eval_F1@10": 0.1977849653076471,
"eval_F1@5": 0.2771428832605307,
"eval_F1@M": 0.3029857823291265,
"eval_P@10": 0.17059999999999995,
"eval_P@5": 0.33559999999999995,
"eval_P@M": 0.42588095238095236,
"eval_R@10": 0.2556045288045292,
"eval_R@5": 0.251349622599623,
"eval_R@M": 0.2556045288045292,
"eval_loss": 2.812638282775879,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 298.6756,
"eval_samples_per_second": 1.674,
"eval_steps_per_second": 1.674,
"step": 1000
},
{
"epoch": 1.5,
"learning_rate": 9.899387755102041e-05,
"loss": 2.9718,
"step": 1500
},
{
"epoch": 1.5,
"eval_F1@10": 0.21689912919673357,
"eval_F1@5": 0.303470865735572,
"eval_F1@M": 0.3314612888315681,
"eval_P@10": 0.18799999999999992,
"eval_P@5": 0.3703999999999999,
"eval_P@M": 0.4614,
"eval_R@10": 0.2789250194250196,
"eval_R@5": 0.27387566877566905,
"eval_R@M": 0.2789250194250196,
"eval_loss": 2.4728078842163086,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 307.3423,
"eval_samples_per_second": 1.627,
"eval_steps_per_second": 1.627,
"step": 1500
},
{
"epoch": 2.0,
"learning_rate": 9.79734693877551e-05,
"loss": 2.5763,
"step": 2000
},
{
"epoch": 2.0,
"eval_F1@10": 0.21342376898165072,
"eval_F1@5": 0.29715987117457776,
"eval_F1@M": 0.3246857584795672,
"eval_P@10": 0.18480000000000008,
"eval_P@5": 0.3628000000000001,
"eval_P@M": 0.44907619047619074,
"eval_R@10": 0.2744417082917087,
"eval_R@5": 0.2677502941502946,
"eval_R@M": 0.2744417082917087,
"eval_loss": 2.183018445968628,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 289.0824,
"eval_samples_per_second": 1.73,
"eval_steps_per_second": 1.73,
"step": 2000
},
{
"epoch": 2.5,
"learning_rate": 9.695510204081633e-05,
"loss": 2.2131,
"step": 2500
},
{
"epoch": 2.5,
"eval_F1@10": 0.22083437505943945,
"eval_F1@5": 0.3085772965596502,
"eval_F1@M": 0.33408261078446894,
"eval_P@10": 0.1906,
"eval_P@5": 0.3736000000000001,
"eval_P@M": 0.45226190476190464,
"eval_R@10": 0.2875526029526035,
"eval_R@5": 0.28179986124986167,
"eval_R@M": 0.2875526029526035,
"eval_loss": 2.037614107131958,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 294.2365,
"eval_samples_per_second": 1.699,
"eval_steps_per_second": 1.699,
"step": 2500
},
{
"epoch": 3.0,
"learning_rate": 9.593469387755103e-05,
"loss": 2.0094,
"step": 3000
},
{
"epoch": 3.0,
"eval_F1@10": 0.23622480848222596,
"eval_F1@5": 0.32680995997466633,
"eval_F1@M": 0.3509576027172007,
"eval_P@10": 0.2044,
"eval_P@5": 0.39799999999999996,
"eval_P@M": 0.4652142857142857,
"eval_R@10": 0.30521768231768254,
"eval_R@5": 0.29608175158175193,
"eval_R@M": 0.30521768231768254,
"eval_loss": 1.9597641229629517,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 299.8378,
"eval_samples_per_second": 1.668,
"eval_steps_per_second": 1.668,
"step": 3000
},
{
"epoch": 3.5,
"learning_rate": 9.491428571428572e-05,
"loss": 1.7087,
"step": 3500
},
{
"epoch": 3.5,
"eval_F1@10": 0.23585947180128827,
"eval_F1@5": 0.32583185474656123,
"eval_F1@M": 0.3484568159051137,
"eval_P@10": 0.20420000000000005,
"eval_P@5": 0.39679999999999993,
"eval_P@M": 0.457257142857143,
"eval_R@10": 0.3021705960705962,
"eval_R@5": 0.2934577533577537,
"eval_R@M": 0.3021705960705962,
"eval_loss": 1.9531850814819336,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 291.44,
"eval_samples_per_second": 1.716,
"eval_steps_per_second": 1.716,
"step": 3500
},
{
"epoch": 4.0,
"learning_rate": 9.389387755102042e-05,
"loss": 1.7346,
"step": 4000
},
{
"epoch": 4.0,
"eval_F1@10": 0.23949844293171174,
"eval_F1@5": 0.3324181589652182,
"eval_F1@M": 0.3555839600200287,
"eval_P@10": 0.20739999999999992,
"eval_P@5": 0.40439999999999987,
"eval_P@M": 0.46959285714285726,
"eval_R@10": 0.307689471639472,
"eval_R@5": 0.30029141969142004,
"eval_R@M": 0.307689471639472,
"eval_loss": 1.8844341039657593,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 279.8232,
"eval_samples_per_second": 1.787,
"eval_steps_per_second": 1.787,
"step": 4000
},
{
"epoch": 4.5,
"learning_rate": 9.287551020408164e-05,
"loss": 1.4093,
"step": 4500
},
{
"epoch": 4.5,
"eval_F1@10": 0.23374703381451323,
"eval_F1@5": 0.3258455720749842,
"eval_F1@M": 0.34501260196631756,
"eval_P@10": 0.2024,
"eval_P@5": 0.3964,
"eval_P@M": 0.4511738095238098,
"eval_R@10": 0.29999401709401724,
"eval_R@5": 0.2942325452325456,
"eval_R@M": 0.29999401709401724,
"eval_loss": 1.8626010417938232,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 281.3111,
"eval_samples_per_second": 1.777,
"eval_steps_per_second": 1.777,
"step": 4500
},
{
"epoch": 5.0,
"learning_rate": 9.185510204081633e-05,
"loss": 1.5068,
"step": 5000
},
{
"epoch": 5.0,
"eval_F1@10": 0.24335615627100407,
"eval_F1@5": 0.3396655599302659,
"eval_F1@M": 0.3602646628912888,
"eval_P@10": 0.21099999999999977,
"eval_P@5": 0.4139999999999996,
"eval_P@M": 0.4727857142857141,
"eval_R@10": 0.3119000777000777,
"eval_R@5": 0.30657915417915416,
"eval_R@M": 0.3119000777000777,
"eval_loss": 1.7979589700698853,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 280.6796,
"eval_samples_per_second": 1.781,
"eval_steps_per_second": 1.781,
"step": 5000
},
{
"epoch": 5.5,
"learning_rate": 9.083469387755103e-05,
"loss": 1.3146,
"step": 5500
},
{
"epoch": 5.5,
"eval_F1@10": 0.24001641670200757,
"eval_F1@5": 0.334409038673745,
"eval_F1@M": 0.3550115948035458,
"eval_P@10": 0.20839999999999997,
"eval_P@5": 0.40799999999999986,
"eval_P@M": 0.46737857142857153,
"eval_R@10": 0.30688550338550347,
"eval_R@5": 0.30161761016761024,
"eval_R@M": 0.30688550338550347,
"eval_loss": 1.8715476989746094,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 280.9732,
"eval_samples_per_second": 1.78,
"eval_steps_per_second": 1.78,
"step": 5500
},
{
"epoch": 6.0,
"learning_rate": 8.981428571428572e-05,
"loss": 1.2704,
"step": 6000
},
{
"epoch": 6.0,
"eval_F1@10": 0.24096180425219377,
"eval_F1@5": 0.334974600889307,
"eval_F1@M": 0.35426202280691466,
"eval_P@10": 0.20859999999999995,
"eval_P@5": 0.4076,
"eval_P@M": 0.4599071428571428,
"eval_R@10": 0.30986234321234324,
"eval_R@5": 0.30275404595404604,
"eval_R@M": 0.30986234321234324,
"eval_loss": 1.8688002824783325,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 279.0562,
"eval_samples_per_second": 1.792,
"eval_steps_per_second": 1.792,
"step": 6000
},
{
"epoch": 6.5,
"learning_rate": 8.879591836734694e-05,
"loss": 1.1731,
"step": 6500
},
{
"epoch": 6.5,
"eval_F1@10": 0.2441899110215107,
"eval_F1@5": 0.3420338693985756,
"eval_F1@M": 0.36420169024302196,
"eval_P@10": 0.2115999999999999,
"eval_P@5": 0.41599999999999987,
"eval_P@M": 0.4780619047619047,
"eval_R@10": 0.31397009102009105,
"eval_R@5": 0.3098475080475081,
"eval_R@M": 0.31397009102009105,
"eval_loss": 1.8536425828933716,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 291.8339,
"eval_samples_per_second": 1.713,
"eval_steps_per_second": 1.713,
"step": 6500
},
{
"epoch": 7.0,
"learning_rate": 8.777551020408164e-05,
"loss": 1.1174,
"step": 7000
},
{
"epoch": 7.0,
"eval_F1@10": 0.24262947404967916,
"eval_F1@5": 0.33894085685556324,
"eval_F1@M": 0.35926122996370713,
"eval_P@10": 0.21039999999999992,
"eval_P@5": 0.4128,
"eval_P@M": 0.46843333333333326,
"eval_R@10": 0.31144045954045946,
"eval_R@5": 0.30653605838605835,
"eval_R@M": 0.31144045954045946,
"eval_loss": 1.8547453880310059,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 293.7424,
"eval_samples_per_second": 1.702,
"eval_steps_per_second": 1.702,
"step": 7000
},
{
"epoch": 7.5,
"learning_rate": 8.675510204081633e-05,
"loss": 1.0319,
"step": 7500
},
{
"epoch": 7.5,
"eval_F1@10": 0.24435341427092733,
"eval_F1@5": 0.34094378497319694,
"eval_F1@M": 0.36301657635450263,
"eval_P@10": 0.21159999999999995,
"eval_P@5": 0.4139999999999999,
"eval_P@M": 0.4739333333333334,
"eval_R@10": 0.31494397269397284,
"eval_R@5": 0.30938704628704644,
"eval_R@M": 0.31494397269397284,
"eval_loss": 1.8866732120513916,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 298.9317,
"eval_samples_per_second": 1.673,
"eval_steps_per_second": 1.673,
"step": 7500
},
{
"epoch": 8.0,
"learning_rate": 8.573469387755101e-05,
"loss": 1.0172,
"step": 8000
},
{
"epoch": 8.0,
"eval_F1@10": 0.2461478679992482,
"eval_F1@5": 0.34169924781101274,
"eval_F1@M": 0.36424212479986534,
"eval_P@10": 0.21280000000000002,
"eval_P@5": 0.41439999999999994,
"eval_P@M": 0.47244523809523775,
"eval_R@10": 0.3185173215673219,
"eval_R@5": 0.3108509435009436,
"eval_R@M": 0.3185173215673219,
"eval_loss": 1.9575016498565674,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 264.7319,
"eval_samples_per_second": 1.889,
"eval_steps_per_second": 1.889,
"step": 8000
},
{
"epoch": 8.5,
"learning_rate": 8.471632653061225e-05,
"loss": 0.9324,
"step": 8500
},
{
"epoch": 8.5,
"eval_F1@10": 0.23868666530445426,
"eval_F1@5": 0.3324125028566208,
"eval_F1@M": 0.3539066449202676,
"eval_P@10": 0.20719999999999994,
"eval_P@5": 0.4051999999999999,
"eval_P@M": 0.46190476190476165,
"eval_R@10": 0.3066111166611168,
"eval_R@5": 0.3009154456654457,
"eval_R@M": 0.3066111166611168,
"eval_loss": 1.9488437175750732,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 286.0434,
"eval_samples_per_second": 1.748,
"eval_steps_per_second": 1.748,
"step": 8500
},
{
"epoch": 9.0,
"learning_rate": 8.369591836734695e-05,
"loss": 0.9587,
"step": 9000
},
{
"epoch": 9.0,
"eval_F1@10": 0.23996280126000177,
"eval_F1@5": 0.33370613928555143,
"eval_F1@M": 0.3559531203402726,
"eval_P@10": 0.20799999999999982,
"eval_P@5": 0.4059999999999997,
"eval_P@M": 0.4660785714285711,
"eval_R@10": 0.30781457986458,
"eval_R@5": 0.30168088578088587,
"eval_R@M": 0.30781457986458,
"eval_loss": 1.9363871812820435,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 282.9341,
"eval_samples_per_second": 1.767,
"eval_steps_per_second": 1.767,
"step": 9000
},
{
"epoch": 9.5,
"learning_rate": 8.267551020408164e-05,
"loss": 0.8864,
"step": 9500
},
{
"epoch": 9.5,
"eval_F1@10": 0.24553398899899156,
"eval_F1@5": 0.33974727821198425,
"eval_F1@M": 0.36148470868656674,
"eval_P@10": 0.21259999999999998,
"eval_P@5": 0.4128,
"eval_P@M": 0.46541666666666653,
"eval_R@10": 0.3148071484071486,
"eval_R@5": 0.3069217227217229,
"eval_R@M": 0.3148071484071486,
"eval_loss": 2.0047595500946045,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 283.5357,
"eval_samples_per_second": 1.763,
"eval_steps_per_second": 1.763,
"step": 9500
},
{
"epoch": 10.0,
"learning_rate": 8.165510204081634e-05,
"loss": 0.8219,
"step": 10000
},
{
"epoch": 10.0,
"eval_F1@10": 0.24542163861026467,
"eval_F1@5": 0.3405659428806491,
"eval_F1@M": 0.36243521048954536,
"eval_P@10": 0.2128,
"eval_P@5": 0.4147999999999997,
"eval_P@M": 0.471490476190476,
"eval_R@10": 0.31549298479298493,
"eval_R@5": 0.30797812187812196,
"eval_R@M": 0.31549298479298493,
"eval_loss": 2.050034999847412,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 284.698,
"eval_samples_per_second": 1.756,
"eval_steps_per_second": 1.756,
"step": 10000
},
{
"epoch": 10.5,
"learning_rate": 8.063469387755103e-05,
"loss": 0.7906,
"step": 10500
},
{
"epoch": 10.5,
"eval_F1@10": 0.24112739408629902,
"eval_F1@5": 0.3361905365875957,
"eval_F1@M": 0.35434909789213215,
"eval_P@10": 0.20859999999999984,
"eval_P@5": 0.4083999999999998,
"eval_P@M": 0.4588999999999998,
"eval_R@10": 0.3117027250527253,
"eval_R@5": 0.3052405316905319,
"eval_R@M": 0.3117027250527253,
"eval_loss": 2.076453685760498,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 283.1972,
"eval_samples_per_second": 1.766,
"eval_steps_per_second": 1.766,
"step": 10500
},
{
"epoch": 11.0,
"learning_rate": 7.961632653061225e-05,
"loss": 0.7828,
"step": 11000
},
{
"epoch": 11.0,
"eval_F1@10": 0.2434173157573352,
"eval_F1@5": 0.3369145302410012,
"eval_F1@M": 0.35818623186239346,
"eval_P@10": 0.21079999999999996,
"eval_P@5": 0.40959999999999974,
"eval_P@M": 0.4597690476190474,
"eval_R@10": 0.3140421911421914,
"eval_R@5": 0.3053971694971696,
"eval_R@M": 0.3140421911421914,
"eval_loss": 2.0442428588867188,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 283.6328,
"eval_samples_per_second": 1.763,
"eval_steps_per_second": 1.763,
"step": 11000
},
{
"epoch": 11.5,
"learning_rate": 7.859795918367348e-05,
"loss": 0.7724,
"step": 11500
},
{
"epoch": 11.5,
"eval_F1@10": 0.24332780944321591,
"eval_F1@5": 0.3358317365640898,
"eval_F1@M": 0.3594637432399048,
"eval_P@10": 0.21079999999999996,
"eval_P@5": 0.40799999999999986,
"eval_P@M": 0.4666904761904761,
"eval_R@10": 0.31255604395604414,
"eval_R@5": 0.3039292041292042,
"eval_R@M": 0.31255604395604414,
"eval_loss": 2.1262500286102295,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 283.3582,
"eval_samples_per_second": 1.765,
"eval_steps_per_second": 1.765,
"step": 11500
},
{
"epoch": 12.0,
"learning_rate": 7.757755102040817e-05,
"loss": 0.6985,
"step": 12000
},
{
"epoch": 12.0,
"eval_F1@10": 0.24282010444872945,
"eval_F1@5": 0.33782710328886834,
"eval_F1@M": 0.35967159486540345,
"eval_P@10": 0.2104,
"eval_P@5": 0.4112,
"eval_P@M": 0.4646380952380953,
"eval_R@10": 0.31213939948939956,
"eval_R@5": 0.30527879342879344,
"eval_R@M": 0.31213939948939956,
"eval_loss": 2.0867960453033447,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 281.5635,
"eval_samples_per_second": 1.776,
"eval_steps_per_second": 1.776,
"step": 12000
},
{
"epoch": 12.5,
"learning_rate": 7.655714285714286e-05,
"loss": 0.6647,
"step": 12500
},
{
"epoch": 12.5,
"eval_F1@10": 0.24765508121946467,
"eval_F1@5": 0.3433662775133368,
"eval_F1@M": 0.3637068867664847,
"eval_P@10": 0.21459999999999982,
"eval_P@5": 0.4179999999999996,
"eval_P@M": 0.4680285714285711,
"eval_R@10": 0.3187178987678989,
"eval_R@5": 0.3105277833277834,
"eval_R@M": 0.3187178987678989,
"eval_loss": 2.156297445297241,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 281.7625,
"eval_samples_per_second": 1.775,
"eval_steps_per_second": 1.775,
"step": 12500
},
{
"epoch": 13.0,
"learning_rate": 7.553673469387756e-05,
"loss": 0.6823,
"step": 13000
},
{
"epoch": 13.0,
"eval_F1@10": 0.25070757222690915,
"eval_F1@5": 0.34642384380325597,
"eval_F1@M": 0.36789754023066784,
"eval_P@10": 0.21759999999999993,
"eval_P@5": 0.4223999999999997,
"eval_P@M": 0.47199523809523813,
"eval_R@10": 0.3204831224331225,
"eval_R@5": 0.3122700632700633,
"eval_R@M": 0.3204831224331225,
"eval_loss": 2.154297113418579,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 283.3444,
"eval_samples_per_second": 1.765,
"eval_steps_per_second": 1.765,
"step": 13000
},
{
"epoch": 13.5,
"learning_rate": 7.451632653061224e-05,
"loss": 0.6039,
"step": 13500
},
{
"epoch": 13.5,
"eval_F1@10": 0.24724974591747426,
"eval_F1@5": 0.34381850469791675,
"eval_F1@M": 0.36370015266810973,
"eval_P@10": 0.21420000000000003,
"eval_P@5": 0.4179999999999999,
"eval_P@M": 0.4715571428571432,
"eval_R@10": 0.31813237873237904,
"eval_R@5": 0.31155258075258097,
"eval_R@M": 0.31813237873237904,
"eval_loss": 2.273547410964966,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 282.8458,
"eval_samples_per_second": 1.768,
"eval_steps_per_second": 1.768,
"step": 13500
},
{
"epoch": 14.0,
"learning_rate": 7.349591836734695e-05,
"loss": 0.6657,
"step": 14000
},
{
"epoch": 14.0,
"eval_F1@10": 0.24294545526488653,
"eval_F1@5": 0.33743259452965385,
"eval_F1@M": 0.35771661821151046,
"eval_P@10": 0.21059999999999995,
"eval_P@5": 0.4103999999999999,
"eval_P@M": 0.4632714285714285,
"eval_R@10": 0.3123259573759575,
"eval_R@5": 0.3057819458319459,
"eval_R@M": 0.3123259573759575,
"eval_loss": 2.2293343544006348,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 284.7498,
"eval_samples_per_second": 1.756,
"eval_steps_per_second": 1.756,
"step": 14000
},
{
"epoch": 14.5,
"learning_rate": 7.247551020408163e-05,
"loss": 0.5512,
"step": 14500
},
{
"epoch": 14.5,
"eval_F1@10": 0.24609090645971843,
"eval_F1@5": 0.341195668057433,
"eval_F1@M": 0.3638307651069263,
"eval_P@10": 0.2134,
"eval_P@5": 0.4151999999999999,
"eval_P@M": 0.47303809523809526,
"eval_R@10": 0.31571549561549583,
"eval_R@5": 0.3083380064380067,
"eval_R@M": 0.31571549561549583,
"eval_loss": 2.2570900917053223,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 289.2337,
"eval_samples_per_second": 1.729,
"eval_steps_per_second": 1.729,
"step": 14500
},
{
"epoch": 15.0,
"learning_rate": 7.145510204081633e-05,
"loss": 0.6125,
"step": 15000
},
{
"epoch": 15.0,
"eval_F1@10": 0.24506923303510375,
"eval_F1@5": 0.34101718379659585,
"eval_F1@M": 0.36054259558810675,
"eval_P@10": 0.21240000000000006,
"eval_P@5": 0.41520000000000007,
"eval_P@M": 0.46649523809523824,
"eval_R@10": 0.3145362748362751,
"eval_R@5": 0.30819146964146976,
"eval_R@M": 0.3145362748362751,
"eval_loss": 2.300617218017578,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 285.2317,
"eval_samples_per_second": 1.753,
"eval_steps_per_second": 1.753,
"step": 15000
},
{
"epoch": 15.5,
"learning_rate": 7.043673469387755e-05,
"loss": 0.5785,
"step": 15500
},
{
"epoch": 15.5,
"eval_F1@10": 0.2442251260644657,
"eval_F1@5": 0.33893644394820904,
"eval_F1@M": 0.35870379697701743,
"eval_P@10": 0.21159999999999998,
"eval_P@5": 0.41240000000000004,
"eval_P@M": 0.46347380952380973,
"eval_R@10": 0.3134413031413033,
"eval_R@5": 0.3057845210345211,
"eval_R@M": 0.3134413031413033,
"eval_loss": 2.338202953338623,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 289.9816,
"eval_samples_per_second": 1.724,
"eval_steps_per_second": 1.724,
"step": 15500
},
{
"epoch": 16.0,
"learning_rate": 6.941632653061226e-05,
"loss": 0.5428,
"step": 16000
},
{
"epoch": 16.0,
"eval_F1@10": 0.2432725372472316,
"eval_F1@5": 0.3373570716864839,
"eval_F1@M": 0.3582228556960761,
"eval_P@10": 0.21059999999999998,
"eval_P@5": 0.4095999999999998,
"eval_P@M": 0.46375,
"eval_R@10": 0.3134618159618162,
"eval_R@5": 0.30584154179154194,
"eval_R@M": 0.3134618159618162,
"eval_loss": 2.3253493309020996,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 289.4094,
"eval_samples_per_second": 1.728,
"eval_steps_per_second": 1.728,
"step": 16000
},
{
"epoch": 16.5,
"learning_rate": 6.839591836734694e-05,
"loss": 0.5194,
"step": 16500
},
{
"epoch": 16.5,
"eval_F1@10": 0.2355793420179682,
"eval_F1@5": 0.3278029424823546,
"eval_F1@M": 0.3482424748282339,
"eval_P@10": 0.20440000000000003,
"eval_P@5": 0.3991999999999999,
"eval_P@M": 0.4537833333333335,
"eval_R@10": 0.30187379287379296,
"eval_R@5": 0.2962392329892331,
"eval_R@M": 0.30187379287379296,
"eval_loss": 2.3528101444244385,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 290.7706,
"eval_samples_per_second": 1.72,
"eval_steps_per_second": 1.72,
"step": 16500
},
{
"epoch": 17.0,
"learning_rate": 6.737551020408163e-05,
"loss": 0.5194,
"step": 17000
},
{
"epoch": 17.0,
"eval_F1@10": 0.24069023813939067,
"eval_F1@5": 0.33479577971048596,
"eval_F1@M": 0.355847497067776,
"eval_P@10": 0.20800000000000002,
"eval_P@5": 0.40559999999999996,
"eval_P@M": 0.46179999999999993,
"eval_R@10": 0.311403085803086,
"eval_R@5": 0.3045922632922635,
"eval_R@M": 0.311403085803086,
"eval_loss": 2.3786723613739014,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 272.2042,
"eval_samples_per_second": 1.837,
"eval_steps_per_second": 1.837,
"step": 17000
},
{
"epoch": 17.5,
"learning_rate": 6.635510204081633e-05,
"loss": 0.4734,
"step": 17500
},
{
"epoch": 17.5,
"eval_F1@10": 0.2424905535962076,
"eval_F1@5": 0.33929873949579886,
"eval_F1@M": 0.36014400369152755,
"eval_P@10": 0.20979999999999996,
"eval_P@5": 0.4119999999999998,
"eval_P@M": 0.46821190476190494,
"eval_R@10": 0.3125397380397382,
"eval_R@5": 0.3077346153846155,
"eval_R@M": 0.3125397380397382,
"eval_loss": 2.3801848888397217,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 269.1685,
"eval_samples_per_second": 1.858,
"eval_steps_per_second": 1.858,
"step": 17500
},
{
"epoch": 18.0,
"learning_rate": 6.533469387755102e-05,
"loss": 0.4685,
"step": 18000
},
{
"epoch": 18.0,
"eval_F1@10": 0.2428809489937239,
"eval_F1@5": 0.34102215725451057,
"eval_F1@M": 0.36136990799018703,
"eval_P@10": 0.20919999999999994,
"eval_P@5": 0.41119999999999984,
"eval_P@M": 0.4681333333333333,
"eval_R@10": 0.31634897324897343,
"eval_R@5": 0.31194796314796325,
"eval_R@M": 0.31634897324897343,
"eval_loss": 2.4091179370880127,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 264.9477,
"eval_samples_per_second": 1.887,
"eval_steps_per_second": 1.887,
"step": 18000
},
{
"epoch": 18.5,
"learning_rate": 6.431428571428572e-05,
"loss": 0.4574,
"step": 18500
},
{
"epoch": 18.5,
"eval_F1@10": 0.24470615952450722,
"eval_F1@5": 0.34083279204455713,
"eval_F1@M": 0.3591474804177593,
"eval_P@10": 0.21199999999999997,
"eval_P@5": 0.41440000000000005,
"eval_P@M": 0.46359047619047605,
"eval_R@10": 0.31490344655344676,
"eval_R@5": 0.30879514929514945,
"eval_R@M": 0.31490344655344676,
"eval_loss": 2.414991617202759,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 289.5904,
"eval_samples_per_second": 1.727,
"eval_steps_per_second": 1.727,
"step": 18500
},
{
"epoch": 19.0,
"learning_rate": 6.329387755102041e-05,
"loss": 0.4411,
"step": 19000
},
{
"epoch": 19.0,
"eval_F1@10": 0.2413860020074456,
"eval_F1@5": 0.3365299011446076,
"eval_F1@M": 0.3552537179710558,
"eval_P@10": 0.20879999999999999,
"eval_P@5": 0.4083999999999998,
"eval_P@M": 0.4593714285714285,
"eval_R@10": 0.31052307137307145,
"eval_R@5": 0.3046235042735043,
"eval_R@M": 0.31052307137307145,
"eval_loss": 2.5369248390197754,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 281.7996,
"eval_samples_per_second": 1.774,
"eval_steps_per_second": 1.774,
"step": 19000
},
{
"epoch": 19.5,
"learning_rate": 6.22734693877551e-05,
"loss": 0.4032,
"step": 19500
},
{
"epoch": 19.5,
"eval_F1@10": 0.2432083462438766,
"eval_F1@5": 0.3403430030753566,
"eval_F1@M": 0.35755804044596656,
"eval_P@10": 0.2102,
"eval_P@5": 0.4132000000000002,
"eval_P@M": 0.4617999999999998,
"eval_R@10": 0.3141284104784106,
"eval_R@5": 0.30864017094017104,
"eval_R@M": 0.3141284104784106,
"eval_loss": 2.560804605484009,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 296.5123,
"eval_samples_per_second": 1.686,
"eval_steps_per_second": 1.686,
"step": 19500
},
{
"epoch": 20.0,
"learning_rate": 6.125510204081633e-05,
"loss": 0.4402,
"step": 20000
},
{
"epoch": 20.0,
"eval_F1@10": 0.24569117638243435,
"eval_F1@5": 0.3409062858709922,
"eval_F1@M": 0.3611119221851426,
"eval_P@10": 0.21239999999999998,
"eval_P@5": 0.41359999999999997,
"eval_P@M": 0.4668095238095235,
"eval_R@10": 0.3174460150960153,
"eval_R@5": 0.3095908924408926,
"eval_R@M": 0.3174460150960153,
"eval_loss": 2.5116209983825684,
"eval_model_name": "t5-small-keyword-generation-inspec",
"eval_runtime": 280.4633,
"eval_samples_per_second": 1.783,
"eval_steps_per_second": 1.783,
"step": 20000
}
],
"max_steps": 50000,
"num_train_epochs": 50,
"total_flos": 2706836029440000.0,
"trial_name": null,
"trial_params": null
}