{ "best_metric": 0.3611119221851426, "best_model_checkpoint": "t5-small-keyword-generation-inspec\\checkpoint-20000", "epoch": 20.0, "global_step": 20000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.5, "learning_rate": 4.93e-05, "loss": 7.9531, "step": 500 }, { "epoch": 0.5, "eval_F1@10": 0.0, "eval_F1@5": 0.0, "eval_F1@M": 0.0, "eval_P@10": 0.0, "eval_P@5": 0.0, "eval_P@M": 0.0, "eval_R@10": 0.0, "eval_R@5": 0.0, "eval_R@M": 0.0, "eval_loss": 4.233538627624512, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 294.894, "eval_samples_per_second": 1.696, "eval_steps_per_second": 1.696, "step": 500 }, { "epoch": 1.0, "learning_rate": 9.93e-05, "loss": 3.9646, "step": 1000 }, { "epoch": 1.0, "eval_F1@10": 0.1977849653076471, "eval_F1@5": 0.2771428832605307, "eval_F1@M": 0.3029857823291265, "eval_P@10": 0.17059999999999995, "eval_P@5": 0.33559999999999995, "eval_P@M": 0.42588095238095236, "eval_R@10": 0.2556045288045292, "eval_R@5": 0.251349622599623, "eval_R@M": 0.2556045288045292, "eval_loss": 2.812638282775879, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 298.6756, "eval_samples_per_second": 1.674, "eval_steps_per_second": 1.674, "step": 1000 }, { "epoch": 1.5, "learning_rate": 9.899387755102041e-05, "loss": 2.9718, "step": 1500 }, { "epoch": 1.5, "eval_F1@10": 0.21689912919673357, "eval_F1@5": 0.303470865735572, "eval_F1@M": 0.3314612888315681, "eval_P@10": 0.18799999999999992, "eval_P@5": 0.3703999999999999, "eval_P@M": 0.4614, "eval_R@10": 0.2789250194250196, "eval_R@5": 0.27387566877566905, "eval_R@M": 0.2789250194250196, "eval_loss": 2.4728078842163086, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 307.3423, "eval_samples_per_second": 1.627, "eval_steps_per_second": 1.627, "step": 1500 }, { "epoch": 2.0, "learning_rate": 9.79734693877551e-05, "loss": 2.5763, "step": 2000 }, { "epoch": 2.0, "eval_F1@10": 0.21342376898165072, "eval_F1@5": 0.29715987117457776, "eval_F1@M": 0.3246857584795672, "eval_P@10": 0.18480000000000008, "eval_P@5": 0.3628000000000001, "eval_P@M": 0.44907619047619074, "eval_R@10": 0.2744417082917087, "eval_R@5": 0.2677502941502946, "eval_R@M": 0.2744417082917087, "eval_loss": 2.183018445968628, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 289.0824, "eval_samples_per_second": 1.73, "eval_steps_per_second": 1.73, "step": 2000 }, { "epoch": 2.5, "learning_rate": 9.695510204081633e-05, "loss": 2.2131, "step": 2500 }, { "epoch": 2.5, "eval_F1@10": 0.22083437505943945, "eval_F1@5": 0.3085772965596502, "eval_F1@M": 0.33408261078446894, "eval_P@10": 0.1906, "eval_P@5": 0.3736000000000001, "eval_P@M": 0.45226190476190464, "eval_R@10": 0.2875526029526035, "eval_R@5": 0.28179986124986167, "eval_R@M": 0.2875526029526035, "eval_loss": 2.037614107131958, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 294.2365, "eval_samples_per_second": 1.699, "eval_steps_per_second": 1.699, "step": 2500 }, { "epoch": 3.0, "learning_rate": 9.593469387755103e-05, "loss": 2.0094, "step": 3000 }, { "epoch": 3.0, "eval_F1@10": 0.23622480848222596, "eval_F1@5": 0.32680995997466633, "eval_F1@M": 0.3509576027172007, "eval_P@10": 0.2044, "eval_P@5": 0.39799999999999996, "eval_P@M": 0.4652142857142857, "eval_R@10": 0.30521768231768254, "eval_R@5": 0.29608175158175193, "eval_R@M": 0.30521768231768254, "eval_loss": 1.9597641229629517, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 299.8378, "eval_samples_per_second": 1.668, "eval_steps_per_second": 1.668, "step": 3000 }, { "epoch": 3.5, "learning_rate": 9.491428571428572e-05, "loss": 1.7087, "step": 3500 }, { "epoch": 3.5, "eval_F1@10": 0.23585947180128827, "eval_F1@5": 0.32583185474656123, "eval_F1@M": 0.3484568159051137, "eval_P@10": 0.20420000000000005, "eval_P@5": 0.39679999999999993, "eval_P@M": 0.457257142857143, "eval_R@10": 0.3021705960705962, "eval_R@5": 0.2934577533577537, "eval_R@M": 0.3021705960705962, "eval_loss": 1.9531850814819336, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 291.44, "eval_samples_per_second": 1.716, "eval_steps_per_second": 1.716, "step": 3500 }, { "epoch": 4.0, "learning_rate": 9.389387755102042e-05, "loss": 1.7346, "step": 4000 }, { "epoch": 4.0, "eval_F1@10": 0.23949844293171174, "eval_F1@5": 0.3324181589652182, "eval_F1@M": 0.3555839600200287, "eval_P@10": 0.20739999999999992, "eval_P@5": 0.40439999999999987, "eval_P@M": 0.46959285714285726, "eval_R@10": 0.307689471639472, "eval_R@5": 0.30029141969142004, "eval_R@M": 0.307689471639472, "eval_loss": 1.8844341039657593, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 279.8232, "eval_samples_per_second": 1.787, "eval_steps_per_second": 1.787, "step": 4000 }, { "epoch": 4.5, "learning_rate": 9.287551020408164e-05, "loss": 1.4093, "step": 4500 }, { "epoch": 4.5, "eval_F1@10": 0.23374703381451323, "eval_F1@5": 0.3258455720749842, "eval_F1@M": 0.34501260196631756, "eval_P@10": 0.2024, "eval_P@5": 0.3964, "eval_P@M": 0.4511738095238098, "eval_R@10": 0.29999401709401724, "eval_R@5": 0.2942325452325456, "eval_R@M": 0.29999401709401724, "eval_loss": 1.8626010417938232, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 281.3111, "eval_samples_per_second": 1.777, "eval_steps_per_second": 1.777, "step": 4500 }, { "epoch": 5.0, "learning_rate": 9.185510204081633e-05, "loss": 1.5068, "step": 5000 }, { "epoch": 5.0, "eval_F1@10": 0.24335615627100407, "eval_F1@5": 0.3396655599302659, "eval_F1@M": 0.3602646628912888, "eval_P@10": 0.21099999999999977, "eval_P@5": 0.4139999999999996, "eval_P@M": 0.4727857142857141, "eval_R@10": 0.3119000777000777, "eval_R@5": 0.30657915417915416, "eval_R@M": 0.3119000777000777, "eval_loss": 1.7979589700698853, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 280.6796, "eval_samples_per_second": 1.781, "eval_steps_per_second": 1.781, "step": 5000 }, { "epoch": 5.5, "learning_rate": 9.083469387755103e-05, "loss": 1.3146, "step": 5500 }, { "epoch": 5.5, "eval_F1@10": 0.24001641670200757, "eval_F1@5": 0.334409038673745, "eval_F1@M": 0.3550115948035458, "eval_P@10": 0.20839999999999997, "eval_P@5": 0.40799999999999986, "eval_P@M": 0.46737857142857153, "eval_R@10": 0.30688550338550347, "eval_R@5": 0.30161761016761024, "eval_R@M": 0.30688550338550347, "eval_loss": 1.8715476989746094, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 280.9732, "eval_samples_per_second": 1.78, "eval_steps_per_second": 1.78, "step": 5500 }, { "epoch": 6.0, "learning_rate": 8.981428571428572e-05, "loss": 1.2704, "step": 6000 }, { "epoch": 6.0, "eval_F1@10": 0.24096180425219377, "eval_F1@5": 0.334974600889307, "eval_F1@M": 0.35426202280691466, "eval_P@10": 0.20859999999999995, "eval_P@5": 0.4076, "eval_P@M": 0.4599071428571428, "eval_R@10": 0.30986234321234324, "eval_R@5": 0.30275404595404604, "eval_R@M": 0.30986234321234324, "eval_loss": 1.8688002824783325, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 279.0562, "eval_samples_per_second": 1.792, "eval_steps_per_second": 1.792, "step": 6000 }, { "epoch": 6.5, "learning_rate": 8.879591836734694e-05, "loss": 1.1731, "step": 6500 }, { "epoch": 6.5, "eval_F1@10": 0.2441899110215107, "eval_F1@5": 0.3420338693985756, "eval_F1@M": 0.36420169024302196, "eval_P@10": 0.2115999999999999, "eval_P@5": 0.41599999999999987, "eval_P@M": 0.4780619047619047, "eval_R@10": 0.31397009102009105, "eval_R@5": 0.3098475080475081, "eval_R@M": 0.31397009102009105, "eval_loss": 1.8536425828933716, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 291.8339, "eval_samples_per_second": 1.713, "eval_steps_per_second": 1.713, "step": 6500 }, { "epoch": 7.0, "learning_rate": 8.777551020408164e-05, "loss": 1.1174, "step": 7000 }, { "epoch": 7.0, "eval_F1@10": 0.24262947404967916, "eval_F1@5": 0.33894085685556324, "eval_F1@M": 0.35926122996370713, "eval_P@10": 0.21039999999999992, "eval_P@5": 0.4128, "eval_P@M": 0.46843333333333326, "eval_R@10": 0.31144045954045946, "eval_R@5": 0.30653605838605835, "eval_R@M": 0.31144045954045946, "eval_loss": 1.8547453880310059, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 293.7424, "eval_samples_per_second": 1.702, "eval_steps_per_second": 1.702, "step": 7000 }, { "epoch": 7.5, "learning_rate": 8.675510204081633e-05, "loss": 1.0319, "step": 7500 }, { "epoch": 7.5, "eval_F1@10": 0.24435341427092733, "eval_F1@5": 0.34094378497319694, "eval_F1@M": 0.36301657635450263, "eval_P@10": 0.21159999999999995, "eval_P@5": 0.4139999999999999, "eval_P@M": 0.4739333333333334, "eval_R@10": 0.31494397269397284, "eval_R@5": 0.30938704628704644, "eval_R@M": 0.31494397269397284, "eval_loss": 1.8866732120513916, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 298.9317, "eval_samples_per_second": 1.673, "eval_steps_per_second": 1.673, "step": 7500 }, { "epoch": 8.0, "learning_rate": 8.573469387755101e-05, "loss": 1.0172, "step": 8000 }, { "epoch": 8.0, "eval_F1@10": 0.2461478679992482, "eval_F1@5": 0.34169924781101274, "eval_F1@M": 0.36424212479986534, "eval_P@10": 0.21280000000000002, "eval_P@5": 0.41439999999999994, "eval_P@M": 0.47244523809523775, "eval_R@10": 0.3185173215673219, "eval_R@5": 0.3108509435009436, "eval_R@M": 0.3185173215673219, "eval_loss": 1.9575016498565674, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 264.7319, "eval_samples_per_second": 1.889, "eval_steps_per_second": 1.889, "step": 8000 }, { "epoch": 8.5, "learning_rate": 8.471632653061225e-05, "loss": 0.9324, "step": 8500 }, { "epoch": 8.5, "eval_F1@10": 0.23868666530445426, "eval_F1@5": 0.3324125028566208, "eval_F1@M": 0.3539066449202676, "eval_P@10": 0.20719999999999994, "eval_P@5": 0.4051999999999999, "eval_P@M": 0.46190476190476165, "eval_R@10": 0.3066111166611168, "eval_R@5": 0.3009154456654457, "eval_R@M": 0.3066111166611168, "eval_loss": 1.9488437175750732, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 286.0434, "eval_samples_per_second": 1.748, "eval_steps_per_second": 1.748, "step": 8500 }, { "epoch": 9.0, "learning_rate": 8.369591836734695e-05, "loss": 0.9587, "step": 9000 }, { "epoch": 9.0, "eval_F1@10": 0.23996280126000177, "eval_F1@5": 0.33370613928555143, "eval_F1@M": 0.3559531203402726, "eval_P@10": 0.20799999999999982, "eval_P@5": 0.4059999999999997, "eval_P@M": 0.4660785714285711, "eval_R@10": 0.30781457986458, "eval_R@5": 0.30168088578088587, "eval_R@M": 0.30781457986458, "eval_loss": 1.9363871812820435, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 282.9341, "eval_samples_per_second": 1.767, "eval_steps_per_second": 1.767, "step": 9000 }, { "epoch": 9.5, "learning_rate": 8.267551020408164e-05, "loss": 0.8864, "step": 9500 }, { "epoch": 9.5, "eval_F1@10": 0.24553398899899156, "eval_F1@5": 0.33974727821198425, "eval_F1@M": 0.36148470868656674, "eval_P@10": 0.21259999999999998, "eval_P@5": 0.4128, "eval_P@M": 0.46541666666666653, "eval_R@10": 0.3148071484071486, "eval_R@5": 0.3069217227217229, "eval_R@M": 0.3148071484071486, "eval_loss": 2.0047595500946045, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 283.5357, "eval_samples_per_second": 1.763, "eval_steps_per_second": 1.763, "step": 9500 }, { "epoch": 10.0, "learning_rate": 8.165510204081634e-05, "loss": 0.8219, "step": 10000 }, { "epoch": 10.0, "eval_F1@10": 0.24542163861026467, "eval_F1@5": 0.3405659428806491, "eval_F1@M": 0.36243521048954536, "eval_P@10": 0.2128, "eval_P@5": 0.4147999999999997, "eval_P@M": 0.471490476190476, "eval_R@10": 0.31549298479298493, "eval_R@5": 0.30797812187812196, "eval_R@M": 0.31549298479298493, "eval_loss": 2.050034999847412, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 284.698, "eval_samples_per_second": 1.756, "eval_steps_per_second": 1.756, "step": 10000 }, { "epoch": 10.5, "learning_rate": 8.063469387755103e-05, "loss": 0.7906, "step": 10500 }, { "epoch": 10.5, "eval_F1@10": 0.24112739408629902, "eval_F1@5": 0.3361905365875957, "eval_F1@M": 0.35434909789213215, "eval_P@10": 0.20859999999999984, "eval_P@5": 0.4083999999999998, "eval_P@M": 0.4588999999999998, "eval_R@10": 0.3117027250527253, "eval_R@5": 0.3052405316905319, "eval_R@M": 0.3117027250527253, "eval_loss": 2.076453685760498, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 283.1972, "eval_samples_per_second": 1.766, "eval_steps_per_second": 1.766, "step": 10500 }, { "epoch": 11.0, "learning_rate": 7.961632653061225e-05, "loss": 0.7828, "step": 11000 }, { "epoch": 11.0, "eval_F1@10": 0.2434173157573352, "eval_F1@5": 0.3369145302410012, "eval_F1@M": 0.35818623186239346, "eval_P@10": 0.21079999999999996, "eval_P@5": 0.40959999999999974, "eval_P@M": 0.4597690476190474, "eval_R@10": 0.3140421911421914, "eval_R@5": 0.3053971694971696, "eval_R@M": 0.3140421911421914, "eval_loss": 2.0442428588867188, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 283.6328, "eval_samples_per_second": 1.763, "eval_steps_per_second": 1.763, "step": 11000 }, { "epoch": 11.5, "learning_rate": 7.859795918367348e-05, "loss": 0.7724, "step": 11500 }, { "epoch": 11.5, "eval_F1@10": 0.24332780944321591, "eval_F1@5": 0.3358317365640898, "eval_F1@M": 0.3594637432399048, "eval_P@10": 0.21079999999999996, "eval_P@5": 0.40799999999999986, "eval_P@M": 0.4666904761904761, "eval_R@10": 0.31255604395604414, "eval_R@5": 0.3039292041292042, "eval_R@M": 0.31255604395604414, "eval_loss": 2.1262500286102295, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 283.3582, "eval_samples_per_second": 1.765, "eval_steps_per_second": 1.765, "step": 11500 }, { "epoch": 12.0, "learning_rate": 7.757755102040817e-05, "loss": 0.6985, "step": 12000 }, { "epoch": 12.0, "eval_F1@10": 0.24282010444872945, "eval_F1@5": 0.33782710328886834, "eval_F1@M": 0.35967159486540345, "eval_P@10": 0.2104, "eval_P@5": 0.4112, "eval_P@M": 0.4646380952380953, "eval_R@10": 0.31213939948939956, "eval_R@5": 0.30527879342879344, "eval_R@M": 0.31213939948939956, "eval_loss": 2.0867960453033447, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 281.5635, "eval_samples_per_second": 1.776, "eval_steps_per_second": 1.776, "step": 12000 }, { "epoch": 12.5, "learning_rate": 7.655714285714286e-05, "loss": 0.6647, "step": 12500 }, { "epoch": 12.5, "eval_F1@10": 0.24765508121946467, "eval_F1@5": 0.3433662775133368, "eval_F1@M": 0.3637068867664847, "eval_P@10": 0.21459999999999982, "eval_P@5": 0.4179999999999996, "eval_P@M": 0.4680285714285711, "eval_R@10": 0.3187178987678989, "eval_R@5": 0.3105277833277834, "eval_R@M": 0.3187178987678989, "eval_loss": 2.156297445297241, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 281.7625, "eval_samples_per_second": 1.775, "eval_steps_per_second": 1.775, "step": 12500 }, { "epoch": 13.0, "learning_rate": 7.553673469387756e-05, "loss": 0.6823, "step": 13000 }, { "epoch": 13.0, "eval_F1@10": 0.25070757222690915, "eval_F1@5": 0.34642384380325597, "eval_F1@M": 0.36789754023066784, "eval_P@10": 0.21759999999999993, "eval_P@5": 0.4223999999999997, "eval_P@M": 0.47199523809523813, "eval_R@10": 0.3204831224331225, "eval_R@5": 0.3122700632700633, "eval_R@M": 0.3204831224331225, "eval_loss": 2.154297113418579, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 283.3444, "eval_samples_per_second": 1.765, "eval_steps_per_second": 1.765, "step": 13000 }, { "epoch": 13.5, "learning_rate": 7.451632653061224e-05, "loss": 0.6039, "step": 13500 }, { "epoch": 13.5, "eval_F1@10": 0.24724974591747426, "eval_F1@5": 0.34381850469791675, "eval_F1@M": 0.36370015266810973, "eval_P@10": 0.21420000000000003, "eval_P@5": 0.4179999999999999, "eval_P@M": 0.4715571428571432, "eval_R@10": 0.31813237873237904, "eval_R@5": 0.31155258075258097, "eval_R@M": 0.31813237873237904, "eval_loss": 2.273547410964966, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 282.8458, "eval_samples_per_second": 1.768, "eval_steps_per_second": 1.768, "step": 13500 }, { "epoch": 14.0, "learning_rate": 7.349591836734695e-05, "loss": 0.6657, "step": 14000 }, { "epoch": 14.0, "eval_F1@10": 0.24294545526488653, "eval_F1@5": 0.33743259452965385, "eval_F1@M": 0.35771661821151046, "eval_P@10": 0.21059999999999995, "eval_P@5": 0.4103999999999999, "eval_P@M": 0.4632714285714285, "eval_R@10": 0.3123259573759575, "eval_R@5": 0.3057819458319459, "eval_R@M": 0.3123259573759575, "eval_loss": 2.2293343544006348, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 284.7498, "eval_samples_per_second": 1.756, "eval_steps_per_second": 1.756, "step": 14000 }, { "epoch": 14.5, "learning_rate": 7.247551020408163e-05, "loss": 0.5512, "step": 14500 }, { "epoch": 14.5, "eval_F1@10": 0.24609090645971843, "eval_F1@5": 0.341195668057433, "eval_F1@M": 0.3638307651069263, "eval_P@10": 0.2134, "eval_P@5": 0.4151999999999999, "eval_P@M": 0.47303809523809526, "eval_R@10": 0.31571549561549583, "eval_R@5": 0.3083380064380067, "eval_R@M": 0.31571549561549583, "eval_loss": 2.2570900917053223, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 289.2337, "eval_samples_per_second": 1.729, "eval_steps_per_second": 1.729, "step": 14500 }, { "epoch": 15.0, "learning_rate": 7.145510204081633e-05, "loss": 0.6125, "step": 15000 }, { "epoch": 15.0, "eval_F1@10": 0.24506923303510375, "eval_F1@5": 0.34101718379659585, "eval_F1@M": 0.36054259558810675, "eval_P@10": 0.21240000000000006, "eval_P@5": 0.41520000000000007, "eval_P@M": 0.46649523809523824, "eval_R@10": 0.3145362748362751, "eval_R@5": 0.30819146964146976, "eval_R@M": 0.3145362748362751, "eval_loss": 2.300617218017578, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 285.2317, "eval_samples_per_second": 1.753, "eval_steps_per_second": 1.753, "step": 15000 }, { "epoch": 15.5, "learning_rate": 7.043673469387755e-05, "loss": 0.5785, "step": 15500 }, { "epoch": 15.5, "eval_F1@10": 0.2442251260644657, "eval_F1@5": 0.33893644394820904, "eval_F1@M": 0.35870379697701743, "eval_P@10": 0.21159999999999998, "eval_P@5": 0.41240000000000004, "eval_P@M": 0.46347380952380973, "eval_R@10": 0.3134413031413033, "eval_R@5": 0.3057845210345211, "eval_R@M": 0.3134413031413033, "eval_loss": 2.338202953338623, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 289.9816, "eval_samples_per_second": 1.724, "eval_steps_per_second": 1.724, "step": 15500 }, { "epoch": 16.0, "learning_rate": 6.941632653061226e-05, "loss": 0.5428, "step": 16000 }, { "epoch": 16.0, "eval_F1@10": 0.2432725372472316, "eval_F1@5": 0.3373570716864839, "eval_F1@M": 0.3582228556960761, "eval_P@10": 0.21059999999999998, "eval_P@5": 0.4095999999999998, "eval_P@M": 0.46375, "eval_R@10": 0.3134618159618162, "eval_R@5": 0.30584154179154194, "eval_R@M": 0.3134618159618162, "eval_loss": 2.3253493309020996, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 289.4094, "eval_samples_per_second": 1.728, "eval_steps_per_second": 1.728, "step": 16000 }, { "epoch": 16.5, "learning_rate": 6.839591836734694e-05, "loss": 0.5194, "step": 16500 }, { "epoch": 16.5, "eval_F1@10": 0.2355793420179682, "eval_F1@5": 0.3278029424823546, "eval_F1@M": 0.3482424748282339, "eval_P@10": 0.20440000000000003, "eval_P@5": 0.3991999999999999, "eval_P@M": 0.4537833333333335, "eval_R@10": 0.30187379287379296, "eval_R@5": 0.2962392329892331, "eval_R@M": 0.30187379287379296, "eval_loss": 2.3528101444244385, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 290.7706, "eval_samples_per_second": 1.72, "eval_steps_per_second": 1.72, "step": 16500 }, { "epoch": 17.0, "learning_rate": 6.737551020408163e-05, "loss": 0.5194, "step": 17000 }, { "epoch": 17.0, "eval_F1@10": 0.24069023813939067, "eval_F1@5": 0.33479577971048596, "eval_F1@M": 0.355847497067776, "eval_P@10": 0.20800000000000002, "eval_P@5": 0.40559999999999996, "eval_P@M": 0.46179999999999993, "eval_R@10": 0.311403085803086, "eval_R@5": 0.3045922632922635, "eval_R@M": 0.311403085803086, "eval_loss": 2.3786723613739014, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 272.2042, "eval_samples_per_second": 1.837, "eval_steps_per_second": 1.837, "step": 17000 }, { "epoch": 17.5, "learning_rate": 6.635510204081633e-05, "loss": 0.4734, "step": 17500 }, { "epoch": 17.5, "eval_F1@10": 0.2424905535962076, "eval_F1@5": 0.33929873949579886, "eval_F1@M": 0.36014400369152755, "eval_P@10": 0.20979999999999996, "eval_P@5": 0.4119999999999998, "eval_P@M": 0.46821190476190494, "eval_R@10": 0.3125397380397382, "eval_R@5": 0.3077346153846155, "eval_R@M": 0.3125397380397382, "eval_loss": 2.3801848888397217, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 269.1685, "eval_samples_per_second": 1.858, "eval_steps_per_second": 1.858, "step": 17500 }, { "epoch": 18.0, "learning_rate": 6.533469387755102e-05, "loss": 0.4685, "step": 18000 }, { "epoch": 18.0, "eval_F1@10": 0.2428809489937239, "eval_F1@5": 0.34102215725451057, "eval_F1@M": 0.36136990799018703, "eval_P@10": 0.20919999999999994, "eval_P@5": 0.41119999999999984, "eval_P@M": 0.4681333333333333, "eval_R@10": 0.31634897324897343, "eval_R@5": 0.31194796314796325, "eval_R@M": 0.31634897324897343, "eval_loss": 2.4091179370880127, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 264.9477, "eval_samples_per_second": 1.887, "eval_steps_per_second": 1.887, "step": 18000 }, { "epoch": 18.5, "learning_rate": 6.431428571428572e-05, "loss": 0.4574, "step": 18500 }, { "epoch": 18.5, "eval_F1@10": 0.24470615952450722, "eval_F1@5": 0.34083279204455713, "eval_F1@M": 0.3591474804177593, "eval_P@10": 0.21199999999999997, "eval_P@5": 0.41440000000000005, "eval_P@M": 0.46359047619047605, "eval_R@10": 0.31490344655344676, "eval_R@5": 0.30879514929514945, "eval_R@M": 0.31490344655344676, "eval_loss": 2.414991617202759, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 289.5904, "eval_samples_per_second": 1.727, "eval_steps_per_second": 1.727, "step": 18500 }, { "epoch": 19.0, "learning_rate": 6.329387755102041e-05, "loss": 0.4411, "step": 19000 }, { "epoch": 19.0, "eval_F1@10": 0.2413860020074456, "eval_F1@5": 0.3365299011446076, "eval_F1@M": 0.3552537179710558, "eval_P@10": 0.20879999999999999, "eval_P@5": 0.4083999999999998, "eval_P@M": 0.4593714285714285, "eval_R@10": 0.31052307137307145, "eval_R@5": 0.3046235042735043, "eval_R@M": 0.31052307137307145, "eval_loss": 2.5369248390197754, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 281.7996, "eval_samples_per_second": 1.774, "eval_steps_per_second": 1.774, "step": 19000 }, { "epoch": 19.5, "learning_rate": 6.22734693877551e-05, "loss": 0.4032, "step": 19500 }, { "epoch": 19.5, "eval_F1@10": 0.2432083462438766, "eval_F1@5": 0.3403430030753566, "eval_F1@M": 0.35755804044596656, "eval_P@10": 0.2102, "eval_P@5": 0.4132000000000002, "eval_P@M": 0.4617999999999998, "eval_R@10": 0.3141284104784106, "eval_R@5": 0.30864017094017104, "eval_R@M": 0.3141284104784106, "eval_loss": 2.560804605484009, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 296.5123, "eval_samples_per_second": 1.686, "eval_steps_per_second": 1.686, "step": 19500 }, { "epoch": 20.0, "learning_rate": 6.125510204081633e-05, "loss": 0.4402, "step": 20000 }, { "epoch": 20.0, "eval_F1@10": 0.24569117638243435, "eval_F1@5": 0.3409062858709922, "eval_F1@M": 0.3611119221851426, "eval_P@10": 0.21239999999999998, "eval_P@5": 0.41359999999999997, "eval_P@M": 0.4668095238095235, "eval_R@10": 0.3174460150960153, "eval_R@5": 0.3095908924408926, "eval_R@M": 0.3174460150960153, "eval_loss": 2.5116209983825684, "eval_model_name": "t5-small-keyword-generation-inspec", "eval_runtime": 280.4633, "eval_samples_per_second": 1.783, "eval_steps_per_second": 1.783, "step": 20000 } ], "max_steps": 50000, "num_train_epochs": 50, "total_flos": 2706836029440000.0, "trial_name": null, "trial_params": null }