classify-news-category-iptc / trainer_state.json
ilsilfverskiold's picture
ilsilfverskiold/iptc-newscodes-multilingual-text-classification
45559ac verified
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 3.0,
"eval_steps": 200,
"global_step": 2064,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.014534883720930232,
"grad_norm": 5.562132358551025,
"learning_rate": 4.0000000000000003e-07,
"loss": 2.7844,
"step": 10
},
{
"epoch": 0.029069767441860465,
"grad_norm": 6.067043781280518,
"learning_rate": 8.000000000000001e-07,
"loss": 2.7725,
"step": 20
},
{
"epoch": 0.0436046511627907,
"grad_norm": 6.281836986541748,
"learning_rate": 1.2000000000000002e-06,
"loss": 2.7484,
"step": 30
},
{
"epoch": 0.05813953488372093,
"grad_norm": 5.292967319488525,
"learning_rate": 1.6000000000000001e-06,
"loss": 2.6898,
"step": 40
},
{
"epoch": 0.07267441860465117,
"grad_norm": 6.3012261390686035,
"learning_rate": 2.0000000000000003e-06,
"loss": 2.6246,
"step": 50
},
{
"epoch": 0.0872093023255814,
"grad_norm": 5.181797981262207,
"learning_rate": 2.4000000000000003e-06,
"loss": 2.593,
"step": 60
},
{
"epoch": 0.10174418604651163,
"grad_norm": 6.388678073883057,
"learning_rate": 2.8000000000000003e-06,
"loss": 2.5312,
"step": 70
},
{
"epoch": 0.11627906976744186,
"grad_norm": 5.643568992614746,
"learning_rate": 3.2000000000000003e-06,
"loss": 2.4826,
"step": 80
},
{
"epoch": 0.1308139534883721,
"grad_norm": 5.568506240844727,
"learning_rate": 3.6000000000000003e-06,
"loss": 2.4131,
"step": 90
},
{
"epoch": 0.14534883720930233,
"grad_norm": 5.19083833694458,
"learning_rate": 4.000000000000001e-06,
"loss": 2.415,
"step": 100
},
{
"epoch": 0.15988372093023256,
"grad_norm": 5.537081241607666,
"learning_rate": 4.4e-06,
"loss": 2.3401,
"step": 110
},
{
"epoch": 0.1744186046511628,
"grad_norm": 5.086550235748291,
"learning_rate": 4.800000000000001e-06,
"loss": 2.3943,
"step": 120
},
{
"epoch": 0.18895348837209303,
"grad_norm": 7.545917987823486,
"learning_rate": 5.2e-06,
"loss": 2.2582,
"step": 130
},
{
"epoch": 0.20348837209302326,
"grad_norm": 7.227110862731934,
"learning_rate": 5.600000000000001e-06,
"loss": 2.1587,
"step": 140
},
{
"epoch": 0.2180232558139535,
"grad_norm": 6.003934860229492,
"learning_rate": 6e-06,
"loss": 2.0893,
"step": 150
},
{
"epoch": 0.23255813953488372,
"grad_norm": 6.239010810852051,
"learning_rate": 6.4000000000000006e-06,
"loss": 2.0743,
"step": 160
},
{
"epoch": 0.24709302325581395,
"grad_norm": 7.215450763702393,
"learning_rate": 6.800000000000001e-06,
"loss": 2.0095,
"step": 170
},
{
"epoch": 0.2616279069767442,
"grad_norm": 5.769580364227295,
"learning_rate": 7.2000000000000005e-06,
"loss": 2.0063,
"step": 180
},
{
"epoch": 0.2761627906976744,
"grad_norm": 7.701093673706055,
"learning_rate": 7.600000000000001e-06,
"loss": 1.9538,
"step": 190
},
{
"epoch": 0.29069767441860467,
"grad_norm": 8.804961204528809,
"learning_rate": 8.000000000000001e-06,
"loss": 1.9761,
"step": 200
},
{
"epoch": 0.29069767441860467,
"eval_accuracy": 0.64625,
"eval_accuracy_label_arts, culture, entertainment and media": 0.3157894736842105,
"eval_accuracy_label_conflict, war and peace": 0.8315467075038285,
"eval_accuracy_label_crime, law and justice": 0.7628865979381443,
"eval_accuracy_label_disaster, accident, and emergency incident": 0.7054794520547946,
"eval_accuracy_label_economy, business, and finance": 0.5436893203883495,
"eval_accuracy_label_environment": 0.0,
"eval_accuracy_label_health": 0.5,
"eval_accuracy_label_human interest": 0.0,
"eval_accuracy_label_labour": 0.0,
"eval_accuracy_label_lifestyle and leisure": 0.3333333333333333,
"eval_accuracy_label_politics": 0.4843205574912892,
"eval_accuracy_label_religion": 0.0,
"eval_accuracy_label_science and technology": 0.08333333333333333,
"eval_accuracy_label_society": 0.0,
"eval_accuracy_label_sport": 0.9615384615384616,
"eval_accuracy_label_weather": 0.0,
"eval_f1": 0.6164394441800294,
"eval_loss": 1.4046330451965332,
"eval_precision": 0.6057417123934041,
"eval_recall": 0.64625,
"eval_runtime": 12.4531,
"eval_samples_per_second": 128.482,
"eval_steps_per_second": 8.03,
"step": 200
},
{
"epoch": 0.30523255813953487,
"grad_norm": 7.173561096191406,
"learning_rate": 8.400000000000001e-06,
"loss": 1.7684,
"step": 210
},
{
"epoch": 0.31976744186046513,
"grad_norm": 8.086793899536133,
"learning_rate": 8.8e-06,
"loss": 1.7253,
"step": 220
},
{
"epoch": 0.33430232558139533,
"grad_norm": 8.559186935424805,
"learning_rate": 9.200000000000002e-06,
"loss": 1.795,
"step": 230
},
{
"epoch": 0.3488372093023256,
"grad_norm": 6.066705226898193,
"learning_rate": 9.600000000000001e-06,
"loss": 1.6181,
"step": 240
},
{
"epoch": 0.3633720930232558,
"grad_norm": 13.028596878051758,
"learning_rate": 1e-05,
"loss": 1.6328,
"step": 250
},
{
"epoch": 0.37790697674418605,
"grad_norm": 9.958759307861328,
"learning_rate": 1.04e-05,
"loss": 1.6997,
"step": 260
},
{
"epoch": 0.39244186046511625,
"grad_norm": 11.519359588623047,
"learning_rate": 1.0800000000000002e-05,
"loss": 1.6046,
"step": 270
},
{
"epoch": 0.4069767441860465,
"grad_norm": 8.298735618591309,
"learning_rate": 1.1200000000000001e-05,
"loss": 1.4126,
"step": 280
},
{
"epoch": 0.42151162790697677,
"grad_norm": 10.555624961853027,
"learning_rate": 1.16e-05,
"loss": 1.445,
"step": 290
},
{
"epoch": 0.436046511627907,
"grad_norm": 8.33277702331543,
"learning_rate": 1.2e-05,
"loss": 1.4088,
"step": 300
},
{
"epoch": 0.45058139534883723,
"grad_norm": 10.028512001037598,
"learning_rate": 1.2400000000000002e-05,
"loss": 1.3765,
"step": 310
},
{
"epoch": 0.46511627906976744,
"grad_norm": 11.585610389709473,
"learning_rate": 1.2800000000000001e-05,
"loss": 1.409,
"step": 320
},
{
"epoch": 0.4796511627906977,
"grad_norm": 13.202520370483398,
"learning_rate": 1.3200000000000002e-05,
"loss": 1.3285,
"step": 330
},
{
"epoch": 0.4941860465116279,
"grad_norm": 8.829900741577148,
"learning_rate": 1.3600000000000002e-05,
"loss": 1.3261,
"step": 340
},
{
"epoch": 0.5087209302325582,
"grad_norm": 11.259300231933594,
"learning_rate": 1.4e-05,
"loss": 1.4546,
"step": 350
},
{
"epoch": 0.5232558139534884,
"grad_norm": 8.918652534484863,
"learning_rate": 1.4400000000000001e-05,
"loss": 1.2455,
"step": 360
},
{
"epoch": 0.5377906976744186,
"grad_norm": 10.523372650146484,
"learning_rate": 1.48e-05,
"loss": 1.3496,
"step": 370
},
{
"epoch": 0.5523255813953488,
"grad_norm": 13.649139404296875,
"learning_rate": 1.5200000000000002e-05,
"loss": 1.2688,
"step": 380
},
{
"epoch": 0.5668604651162791,
"grad_norm": 15.79927921295166,
"learning_rate": 1.5600000000000003e-05,
"loss": 1.22,
"step": 390
},
{
"epoch": 0.5813953488372093,
"grad_norm": 12.712923049926758,
"learning_rate": 1.6000000000000003e-05,
"loss": 1.2153,
"step": 400
},
{
"epoch": 0.5813953488372093,
"eval_accuracy": 0.689375,
"eval_accuracy_label_arts, culture, entertainment and media": 0.7894736842105263,
"eval_accuracy_label_conflict, war and peace": 0.655436447166922,
"eval_accuracy_label_crime, law and justice": 0.8195876288659794,
"eval_accuracy_label_disaster, accident, and emergency incident": 0.8561643835616438,
"eval_accuracy_label_economy, business, and finance": 0.6407766990291263,
"eval_accuracy_label_environment": 0.2413793103448276,
"eval_accuracy_label_health": 0.8333333333333334,
"eval_accuracy_label_human interest": 0.13636363636363635,
"eval_accuracy_label_labour": 0.0,
"eval_accuracy_label_lifestyle and leisure": 0.6666666666666666,
"eval_accuracy_label_politics": 0.8466898954703833,
"eval_accuracy_label_religion": 0.0,
"eval_accuracy_label_science and technology": 0.375,
"eval_accuracy_label_society": 0.015384615384615385,
"eval_accuracy_label_sport": 0.9615384615384616,
"eval_accuracy_label_weather": 1.0,
"eval_f1": 0.6867853551801604,
"eval_loss": 1.0224822759628296,
"eval_precision": 0.765204058143133,
"eval_recall": 0.689375,
"eval_runtime": 12.5726,
"eval_samples_per_second": 127.261,
"eval_steps_per_second": 7.954,
"step": 400
},
{
"epoch": 0.5959302325581395,
"grad_norm": 11.235016822814941,
"learning_rate": 1.64e-05,
"loss": 1.2041,
"step": 410
},
{
"epoch": 0.6104651162790697,
"grad_norm": 10.808572769165039,
"learning_rate": 1.6800000000000002e-05,
"loss": 1.1168,
"step": 420
},
{
"epoch": 0.625,
"grad_norm": 16.74306869506836,
"learning_rate": 1.72e-05,
"loss": 1.1227,
"step": 430
},
{
"epoch": 0.6395348837209303,
"grad_norm": 9.389023780822754,
"learning_rate": 1.76e-05,
"loss": 1.1575,
"step": 440
},
{
"epoch": 0.6540697674418605,
"grad_norm": 15.347270965576172,
"learning_rate": 1.8e-05,
"loss": 0.9979,
"step": 450
},
{
"epoch": 0.6686046511627907,
"grad_norm": 11.799999237060547,
"learning_rate": 1.8400000000000003e-05,
"loss": 1.0845,
"step": 460
},
{
"epoch": 0.6831395348837209,
"grad_norm": 12.181020736694336,
"learning_rate": 1.88e-05,
"loss": 1.0833,
"step": 470
},
{
"epoch": 0.6976744186046512,
"grad_norm": 12.819634437561035,
"learning_rate": 1.9200000000000003e-05,
"loss": 1.137,
"step": 480
},
{
"epoch": 0.7122093023255814,
"grad_norm": 13.189191818237305,
"learning_rate": 1.9600000000000002e-05,
"loss": 1.0458,
"step": 490
},
{
"epoch": 0.7267441860465116,
"grad_norm": 9.888482093811035,
"learning_rate": 2e-05,
"loss": 1.0184,
"step": 500
},
{
"epoch": 0.7412790697674418,
"grad_norm": 9.71278190612793,
"learning_rate": 1.987212276214834e-05,
"loss": 0.98,
"step": 510
},
{
"epoch": 0.7558139534883721,
"grad_norm": 14.008501052856445,
"learning_rate": 1.9744245524296677e-05,
"loss": 0.9985,
"step": 520
},
{
"epoch": 0.7703488372093024,
"grad_norm": 16.69378662109375,
"learning_rate": 1.9616368286445014e-05,
"loss": 0.9146,
"step": 530
},
{
"epoch": 0.7848837209302325,
"grad_norm": 15.569829940795898,
"learning_rate": 1.9488491048593352e-05,
"loss": 0.9717,
"step": 540
},
{
"epoch": 0.7994186046511628,
"grad_norm": 10.90029239654541,
"learning_rate": 1.936061381074169e-05,
"loss": 1.0832,
"step": 550
},
{
"epoch": 0.813953488372093,
"grad_norm": 16.751508712768555,
"learning_rate": 1.9232736572890027e-05,
"loss": 0.9345,
"step": 560
},
{
"epoch": 0.8284883720930233,
"grad_norm": 14.394732475280762,
"learning_rate": 1.9104859335038365e-05,
"loss": 1.0405,
"step": 570
},
{
"epoch": 0.8430232558139535,
"grad_norm": 11.01040267944336,
"learning_rate": 1.8976982097186702e-05,
"loss": 0.9115,
"step": 580
},
{
"epoch": 0.8575581395348837,
"grad_norm": 15.872978210449219,
"learning_rate": 1.884910485933504e-05,
"loss": 0.8443,
"step": 590
},
{
"epoch": 0.872093023255814,
"grad_norm": 19.019338607788086,
"learning_rate": 1.8721227621483378e-05,
"loss": 0.954,
"step": 600
},
{
"epoch": 0.872093023255814,
"eval_accuracy": 0.723125,
"eval_accuracy_label_arts, culture, entertainment and media": 0.7368421052631579,
"eval_accuracy_label_conflict, war and peace": 0.77947932618683,
"eval_accuracy_label_crime, law and justice": 0.8917525773195877,
"eval_accuracy_label_disaster, accident, and emergency incident": 0.8698630136986302,
"eval_accuracy_label_economy, business, and finance": 0.6213592233009708,
"eval_accuracy_label_environment": 0.3448275862068966,
"eval_accuracy_label_health": 0.8888888888888888,
"eval_accuracy_label_human interest": 0.18181818181818182,
"eval_accuracy_label_labour": 1.0,
"eval_accuracy_label_lifestyle and leisure": 0.5555555555555556,
"eval_accuracy_label_politics": 0.6898954703832753,
"eval_accuracy_label_religion": 0.0,
"eval_accuracy_label_science and technology": 0.25,
"eval_accuracy_label_society": 0.046153846153846156,
"eval_accuracy_label_sport": 0.9615384615384616,
"eval_accuracy_label_weather": 1.0,
"eval_f1": 0.7137964265878213,
"eval_loss": 0.8858376145362854,
"eval_precision": 0.7308873219026191,
"eval_recall": 0.723125,
"eval_runtime": 12.6079,
"eval_samples_per_second": 126.905,
"eval_steps_per_second": 7.932,
"step": 600
},
{
"epoch": 0.8866279069767442,
"grad_norm": 8.310386657714844,
"learning_rate": 1.8593350383631715e-05,
"loss": 0.8133,
"step": 610
},
{
"epoch": 0.9011627906976745,
"grad_norm": 12.042872428894043,
"learning_rate": 1.8465473145780053e-05,
"loss": 0.9059,
"step": 620
},
{
"epoch": 0.9156976744186046,
"grad_norm": 10.83311653137207,
"learning_rate": 1.833759590792839e-05,
"loss": 0.9357,
"step": 630
},
{
"epoch": 0.9302325581395349,
"grad_norm": 11.619269371032715,
"learning_rate": 1.8209718670076728e-05,
"loss": 0.967,
"step": 640
},
{
"epoch": 0.9447674418604651,
"grad_norm": 11.699959754943848,
"learning_rate": 1.8081841432225066e-05,
"loss": 0.748,
"step": 650
},
{
"epoch": 0.9593023255813954,
"grad_norm": 15.047694206237793,
"learning_rate": 1.7953964194373403e-05,
"loss": 0.8928,
"step": 660
},
{
"epoch": 0.9738372093023255,
"grad_norm": 13.320290565490723,
"learning_rate": 1.782608695652174e-05,
"loss": 0.8786,
"step": 670
},
{
"epoch": 0.9883720930232558,
"grad_norm": 13.041028022766113,
"learning_rate": 1.769820971867008e-05,
"loss": 0.9478,
"step": 680
},
{
"epoch": 1.002906976744186,
"grad_norm": 14.132765769958496,
"learning_rate": 1.7570332480818416e-05,
"loss": 0.8231,
"step": 690
},
{
"epoch": 1.0174418604651163,
"grad_norm": 7.3977837562561035,
"learning_rate": 1.7442455242966754e-05,
"loss": 0.7806,
"step": 700
},
{
"epoch": 1.0319767441860466,
"grad_norm": 16.572118759155273,
"learning_rate": 1.731457800511509e-05,
"loss": 0.7654,
"step": 710
},
{
"epoch": 1.0465116279069768,
"grad_norm": 21.040008544921875,
"learning_rate": 1.718670076726343e-05,
"loss": 0.7856,
"step": 720
},
{
"epoch": 1.0610465116279069,
"grad_norm": 21.33478355407715,
"learning_rate": 1.7058823529411767e-05,
"loss": 0.7323,
"step": 730
},
{
"epoch": 1.0755813953488371,
"grad_norm": 13.03322696685791,
"learning_rate": 1.6930946291560104e-05,
"loss": 0.7396,
"step": 740
},
{
"epoch": 1.0901162790697674,
"grad_norm": 19.618709564208984,
"learning_rate": 1.6803069053708442e-05,
"loss": 0.8284,
"step": 750
},
{
"epoch": 1.1046511627906976,
"grad_norm": 21.11569595336914,
"learning_rate": 1.667519181585678e-05,
"loss": 0.7032,
"step": 760
},
{
"epoch": 1.119186046511628,
"grad_norm": 13.00526237487793,
"learning_rate": 1.6547314578005117e-05,
"loss": 0.7199,
"step": 770
},
{
"epoch": 1.1337209302325582,
"grad_norm": 12.57153034210205,
"learning_rate": 1.6419437340153455e-05,
"loss": 0.6688,
"step": 780
},
{
"epoch": 1.1482558139534884,
"grad_norm": 11.098487854003906,
"learning_rate": 1.6291560102301792e-05,
"loss": 0.6463,
"step": 790
},
{
"epoch": 1.1627906976744187,
"grad_norm": 12.68520736694336,
"learning_rate": 1.616368286445013e-05,
"loss": 0.6662,
"step": 800
},
{
"epoch": 1.1627906976744187,
"eval_accuracy": 0.688125,
"eval_accuracy_label_arts, culture, entertainment and media": 0.7894736842105263,
"eval_accuracy_label_conflict, war and peace": 0.6125574272588055,
"eval_accuracy_label_crime, law and justice": 0.845360824742268,
"eval_accuracy_label_disaster, accident, and emergency incident": 0.863013698630137,
"eval_accuracy_label_economy, business, and finance": 0.6504854368932039,
"eval_accuracy_label_environment": 0.4482758620689655,
"eval_accuracy_label_health": 0.7222222222222222,
"eval_accuracy_label_human interest": 0.22727272727272727,
"eval_accuracy_label_labour": 1.0,
"eval_accuracy_label_lifestyle and leisure": 0.4444444444444444,
"eval_accuracy_label_politics": 0.8292682926829268,
"eval_accuracy_label_religion": 0.0,
"eval_accuracy_label_science and technology": 0.5416666666666666,
"eval_accuracy_label_society": 0.23076923076923078,
"eval_accuracy_label_sport": 0.9615384615384616,
"eval_accuracy_label_weather": 1.0,
"eval_f1": 0.7008818694331442,
"eval_loss": 0.9380582571029663,
"eval_precision": 0.7617561903814418,
"eval_recall": 0.688125,
"eval_runtime": 12.5844,
"eval_samples_per_second": 127.142,
"eval_steps_per_second": 7.946,
"step": 800
},
{
"epoch": 1.177325581395349,
"grad_norm": 12.958664894104004,
"learning_rate": 1.6035805626598467e-05,
"loss": 0.6513,
"step": 810
},
{
"epoch": 1.191860465116279,
"grad_norm": 13.338906288146973,
"learning_rate": 1.5907928388746805e-05,
"loss": 0.7241,
"step": 820
},
{
"epoch": 1.2063953488372092,
"grad_norm": 12.350173950195312,
"learning_rate": 1.5780051150895143e-05,
"loss": 0.6857,
"step": 830
},
{
"epoch": 1.2209302325581395,
"grad_norm": 9.547300338745117,
"learning_rate": 1.565217391304348e-05,
"loss": 0.5884,
"step": 840
},
{
"epoch": 1.2354651162790697,
"grad_norm": 9.108930587768555,
"learning_rate": 1.5524296675191818e-05,
"loss": 0.5416,
"step": 850
},
{
"epoch": 1.25,
"grad_norm": 7.098880767822266,
"learning_rate": 1.5396419437340155e-05,
"loss": 0.5443,
"step": 860
},
{
"epoch": 1.2645348837209303,
"grad_norm": 15.5491304397583,
"learning_rate": 1.5268542199488493e-05,
"loss": 0.638,
"step": 870
},
{
"epoch": 1.2790697674418605,
"grad_norm": 14.731600761413574,
"learning_rate": 1.514066496163683e-05,
"loss": 0.6516,
"step": 880
},
{
"epoch": 1.2936046511627908,
"grad_norm": 6.682343006134033,
"learning_rate": 1.5012787723785167e-05,
"loss": 0.6165,
"step": 890
},
{
"epoch": 1.308139534883721,
"grad_norm": 14.463234901428223,
"learning_rate": 1.4884910485933506e-05,
"loss": 0.6455,
"step": 900
},
{
"epoch": 1.322674418604651,
"grad_norm": 14.159065246582031,
"learning_rate": 1.4757033248081842e-05,
"loss": 0.6129,
"step": 910
},
{
"epoch": 1.3372093023255813,
"grad_norm": 14.65009880065918,
"learning_rate": 1.4629156010230181e-05,
"loss": 0.5702,
"step": 920
},
{
"epoch": 1.3517441860465116,
"grad_norm": 16.38220977783203,
"learning_rate": 1.4501278772378517e-05,
"loss": 0.6183,
"step": 930
},
{
"epoch": 1.3662790697674418,
"grad_norm": 9.162236213684082,
"learning_rate": 1.4373401534526856e-05,
"loss": 0.547,
"step": 940
},
{
"epoch": 1.380813953488372,
"grad_norm": 9.222379684448242,
"learning_rate": 1.4245524296675192e-05,
"loss": 0.5629,
"step": 950
},
{
"epoch": 1.3953488372093024,
"grad_norm": 8.016491889953613,
"learning_rate": 1.4117647058823532e-05,
"loss": 0.6529,
"step": 960
},
{
"epoch": 1.4098837209302326,
"grad_norm": 8.260580062866211,
"learning_rate": 1.3989769820971867e-05,
"loss": 0.5309,
"step": 970
},
{
"epoch": 1.4244186046511627,
"grad_norm": 16.81390953063965,
"learning_rate": 1.3861892583120207e-05,
"loss": 0.6785,
"step": 980
},
{
"epoch": 1.4389534883720931,
"grad_norm": 11.895804405212402,
"learning_rate": 1.3734015345268543e-05,
"loss": 0.5976,
"step": 990
},
{
"epoch": 1.4534883720930232,
"grad_norm": 8.548684120178223,
"learning_rate": 1.3606138107416882e-05,
"loss": 0.5554,
"step": 1000
},
{
"epoch": 1.4534883720930232,
"eval_accuracy": 0.7025,
"eval_accuracy_label_arts, culture, entertainment and media": 0.7368421052631579,
"eval_accuracy_label_conflict, war and peace": 0.6477794793261868,
"eval_accuracy_label_crime, law and justice": 0.9020618556701031,
"eval_accuracy_label_disaster, accident, and emergency incident": 0.8561643835616438,
"eval_accuracy_label_economy, business, and finance": 0.6601941747572816,
"eval_accuracy_label_environment": 0.3103448275862069,
"eval_accuracy_label_health": 0.7777777777777778,
"eval_accuracy_label_human interest": 0.36363636363636365,
"eval_accuracy_label_labour": 0.5,
"eval_accuracy_label_lifestyle and leisure": 0.5555555555555556,
"eval_accuracy_label_politics": 0.8083623693379791,
"eval_accuracy_label_religion": 0.0,
"eval_accuracy_label_science and technology": 0.5,
"eval_accuracy_label_society": 0.18461538461538463,
"eval_accuracy_label_sport": 0.9615384615384616,
"eval_accuracy_label_weather": 1.0,
"eval_f1": 0.7123723699365401,
"eval_loss": 0.8791087865829468,
"eval_precision": 0.7628439748212975,
"eval_recall": 0.7025,
"eval_runtime": 12.5844,
"eval_samples_per_second": 127.142,
"eval_steps_per_second": 7.946,
"step": 1000
},
{
"epoch": 1.4680232558139534,
"grad_norm": 13.218795776367188,
"learning_rate": 1.3478260869565218e-05,
"loss": 0.5587,
"step": 1010
},
{
"epoch": 1.4825581395348837,
"grad_norm": 21.222410202026367,
"learning_rate": 1.3350383631713557e-05,
"loss": 0.6128,
"step": 1020
},
{
"epoch": 1.497093023255814,
"grad_norm": 10.608304977416992,
"learning_rate": 1.3222506393861893e-05,
"loss": 0.5334,
"step": 1030
},
{
"epoch": 1.5116279069767442,
"grad_norm": 9.839329719543457,
"learning_rate": 1.3094629156010232e-05,
"loss": 0.4974,
"step": 1040
},
{
"epoch": 1.5261627906976745,
"grad_norm": 16.351816177368164,
"learning_rate": 1.2966751918158568e-05,
"loss": 0.5387,
"step": 1050
},
{
"epoch": 1.5406976744186047,
"grad_norm": 13.274540901184082,
"learning_rate": 1.2838874680306906e-05,
"loss": 0.5928,
"step": 1060
},
{
"epoch": 1.5552325581395348,
"grad_norm": 11.493636131286621,
"learning_rate": 1.2710997442455244e-05,
"loss": 0.4391,
"step": 1070
},
{
"epoch": 1.5697674418604652,
"grad_norm": 7.543900012969971,
"learning_rate": 1.2583120204603581e-05,
"loss": 0.5845,
"step": 1080
},
{
"epoch": 1.5843023255813953,
"grad_norm": 18.52677345275879,
"learning_rate": 1.2455242966751919e-05,
"loss": 0.4857,
"step": 1090
},
{
"epoch": 1.5988372093023255,
"grad_norm": 10.437915802001953,
"learning_rate": 1.2327365728900256e-05,
"loss": 0.4946,
"step": 1100
},
{
"epoch": 1.6133720930232558,
"grad_norm": 9.237434387207031,
"learning_rate": 1.2199488491048594e-05,
"loss": 0.6215,
"step": 1110
},
{
"epoch": 1.627906976744186,
"grad_norm": 15.632594108581543,
"learning_rate": 1.2071611253196932e-05,
"loss": 0.5642,
"step": 1120
},
{
"epoch": 1.6424418604651163,
"grad_norm": 16.443044662475586,
"learning_rate": 1.194373401534527e-05,
"loss": 0.5714,
"step": 1130
},
{
"epoch": 1.6569767441860463,
"grad_norm": 15.662179946899414,
"learning_rate": 1.1815856777493607e-05,
"loss": 0.4438,
"step": 1140
},
{
"epoch": 1.6715116279069768,
"grad_norm": 14.527420043945312,
"learning_rate": 1.1687979539641944e-05,
"loss": 0.5733,
"step": 1150
},
{
"epoch": 1.6860465116279069,
"grad_norm": 20.69162368774414,
"learning_rate": 1.1560102301790282e-05,
"loss": 0.5324,
"step": 1160
},
{
"epoch": 1.7005813953488373,
"grad_norm": 11.502646446228027,
"learning_rate": 1.143222506393862e-05,
"loss": 0.4495,
"step": 1170
},
{
"epoch": 1.7151162790697674,
"grad_norm": 8.692178726196289,
"learning_rate": 1.1304347826086957e-05,
"loss": 0.4218,
"step": 1180
},
{
"epoch": 1.7296511627906976,
"grad_norm": 11.3637113571167,
"learning_rate": 1.1176470588235295e-05,
"loss": 0.5778,
"step": 1190
},
{
"epoch": 1.744186046511628,
"grad_norm": 7.9896721839904785,
"learning_rate": 1.1048593350383632e-05,
"loss": 0.4396,
"step": 1200
},
{
"epoch": 1.744186046511628,
"eval_accuracy": 0.7175,
"eval_accuracy_label_arts, culture, entertainment and media": 0.7894736842105263,
"eval_accuracy_label_conflict, war and peace": 0.663093415007657,
"eval_accuracy_label_crime, law and justice": 0.8195876288659794,
"eval_accuracy_label_disaster, accident, and emergency incident": 0.8835616438356164,
"eval_accuracy_label_economy, business, and finance": 0.6893203883495146,
"eval_accuracy_label_environment": 0.3793103448275862,
"eval_accuracy_label_health": 0.8333333333333334,
"eval_accuracy_label_human interest": 0.4090909090909091,
"eval_accuracy_label_labour": 0.5,
"eval_accuracy_label_lifestyle and leisure": 0.5555555555555556,
"eval_accuracy_label_politics": 0.8362369337979094,
"eval_accuracy_label_religion": 0.0,
"eval_accuracy_label_science and technology": 0.4166666666666667,
"eval_accuracy_label_society": 0.36923076923076925,
"eval_accuracy_label_sport": 0.9615384615384616,
"eval_accuracy_label_weather": 1.0,
"eval_f1": 0.7279616125865503,
"eval_loss": 0.8275023698806763,
"eval_precision": 0.7685711157026855,
"eval_recall": 0.7175,
"eval_runtime": 12.6195,
"eval_samples_per_second": 126.788,
"eval_steps_per_second": 7.924,
"step": 1200
},
{
"epoch": 1.7587209302325582,
"grad_norm": 8.378173828125,
"learning_rate": 1.092071611253197e-05,
"loss": 0.4187,
"step": 1210
},
{
"epoch": 1.7732558139534884,
"grad_norm": 22.63587760925293,
"learning_rate": 1.0792838874680308e-05,
"loss": 0.4558,
"step": 1220
},
{
"epoch": 1.7877906976744184,
"grad_norm": 16.91942596435547,
"learning_rate": 1.0664961636828645e-05,
"loss": 0.6778,
"step": 1230
},
{
"epoch": 1.802325581395349,
"grad_norm": 11.042551040649414,
"learning_rate": 1.0537084398976983e-05,
"loss": 0.5229,
"step": 1240
},
{
"epoch": 1.816860465116279,
"grad_norm": 20.5400390625,
"learning_rate": 1.040920716112532e-05,
"loss": 0.5121,
"step": 1250
},
{
"epoch": 1.8313953488372094,
"grad_norm": 12.495570182800293,
"learning_rate": 1.0281329923273658e-05,
"loss": 0.4737,
"step": 1260
},
{
"epoch": 1.8459302325581395,
"grad_norm": 11.538856506347656,
"learning_rate": 1.0153452685421996e-05,
"loss": 0.3766,
"step": 1270
},
{
"epoch": 1.8604651162790697,
"grad_norm": 8.165515899658203,
"learning_rate": 1.0025575447570333e-05,
"loss": 0.5152,
"step": 1280
},
{
"epoch": 1.875,
"grad_norm": 8.704108238220215,
"learning_rate": 9.897698209718671e-06,
"loss": 0.5027,
"step": 1290
},
{
"epoch": 1.8895348837209303,
"grad_norm": 14.96538257598877,
"learning_rate": 9.769820971867009e-06,
"loss": 0.5427,
"step": 1300
},
{
"epoch": 1.9040697674418605,
"grad_norm": 11.60605525970459,
"learning_rate": 9.641943734015346e-06,
"loss": 0.4236,
"step": 1310
},
{
"epoch": 1.9186046511627906,
"grad_norm": 10.070377349853516,
"learning_rate": 9.514066496163684e-06,
"loss": 0.4683,
"step": 1320
},
{
"epoch": 1.933139534883721,
"grad_norm": 8.57789134979248,
"learning_rate": 9.386189258312021e-06,
"loss": 0.505,
"step": 1330
},
{
"epoch": 1.947674418604651,
"grad_norm": 14.64469051361084,
"learning_rate": 9.258312020460359e-06,
"loss": 0.4311,
"step": 1340
},
{
"epoch": 1.9622093023255816,
"grad_norm": 16.99574851989746,
"learning_rate": 9.130434782608697e-06,
"loss": 0.4414,
"step": 1350
},
{
"epoch": 1.9767441860465116,
"grad_norm": 14.059187889099121,
"learning_rate": 9.002557544757034e-06,
"loss": 0.5001,
"step": 1360
},
{
"epoch": 1.9912790697674418,
"grad_norm": 7.389652729034424,
"learning_rate": 8.874680306905372e-06,
"loss": 0.4546,
"step": 1370
},
{
"epoch": 2.005813953488372,
"grad_norm": 11.378294944763184,
"learning_rate": 8.74680306905371e-06,
"loss": 0.4447,
"step": 1380
},
{
"epoch": 2.020348837209302,
"grad_norm": 9.877668380737305,
"learning_rate": 8.618925831202047e-06,
"loss": 0.4254,
"step": 1390
},
{
"epoch": 2.0348837209302326,
"grad_norm": 5.385466575622559,
"learning_rate": 8.491048593350385e-06,
"loss": 0.383,
"step": 1400
},
{
"epoch": 2.0348837209302326,
"eval_accuracy": 0.745,
"eval_accuracy_label_arts, culture, entertainment and media": 0.6842105263157895,
"eval_accuracy_label_conflict, war and peace": 0.7840735068912711,
"eval_accuracy_label_crime, law and justice": 0.8865979381443299,
"eval_accuracy_label_disaster, accident, and emergency incident": 0.8767123287671232,
"eval_accuracy_label_economy, business, and finance": 0.7087378640776699,
"eval_accuracy_label_environment": 0.4482758620689655,
"eval_accuracy_label_health": 0.7777777777777778,
"eval_accuracy_label_human interest": 0.4090909090909091,
"eval_accuracy_label_labour": 0.5,
"eval_accuracy_label_lifestyle and leisure": 0.5555555555555556,
"eval_accuracy_label_politics": 0.6898954703832753,
"eval_accuracy_label_religion": 0.0,
"eval_accuracy_label_science and technology": 0.4166666666666667,
"eval_accuracy_label_society": 0.2923076923076923,
"eval_accuracy_label_sport": 0.9615384615384616,
"eval_accuracy_label_weather": 0.0,
"eval_f1": 0.7500828579968577,
"eval_loss": 0.7928646206855774,
"eval_precision": 0.7652956903435105,
"eval_recall": 0.745,
"eval_runtime": 12.617,
"eval_samples_per_second": 126.813,
"eval_steps_per_second": 7.926,
"step": 1400
},
{
"epoch": 2.0494186046511627,
"grad_norm": 10.072980880737305,
"learning_rate": 8.363171355498722e-06,
"loss": 0.3935,
"step": 1410
},
{
"epoch": 2.063953488372093,
"grad_norm": 8.466812133789062,
"learning_rate": 8.23529411764706e-06,
"loss": 0.3343,
"step": 1420
},
{
"epoch": 2.078488372093023,
"grad_norm": 8.366528511047363,
"learning_rate": 8.107416879795397e-06,
"loss": 0.3865,
"step": 1430
},
{
"epoch": 2.0930232558139537,
"grad_norm": 9.42149543762207,
"learning_rate": 7.979539641943735e-06,
"loss": 0.3071,
"step": 1440
},
{
"epoch": 2.1075581395348837,
"grad_norm": 7.807155609130859,
"learning_rate": 7.851662404092073e-06,
"loss": 0.3173,
"step": 1450
},
{
"epoch": 2.1220930232558137,
"grad_norm": 9.655524253845215,
"learning_rate": 7.72378516624041e-06,
"loss": 0.4508,
"step": 1460
},
{
"epoch": 2.136627906976744,
"grad_norm": 8.439408302307129,
"learning_rate": 7.595907928388747e-06,
"loss": 0.3745,
"step": 1470
},
{
"epoch": 2.1511627906976742,
"grad_norm": 8.737176895141602,
"learning_rate": 7.468030690537085e-06,
"loss": 0.3132,
"step": 1480
},
{
"epoch": 2.1656976744186047,
"grad_norm": 14.63242244720459,
"learning_rate": 7.340153452685422e-06,
"loss": 0.3235,
"step": 1490
},
{
"epoch": 2.1802325581395348,
"grad_norm": 10.674861907958984,
"learning_rate": 7.21227621483376e-06,
"loss": 0.39,
"step": 1500
},
{
"epoch": 2.1947674418604652,
"grad_norm": 21.4650936126709,
"learning_rate": 7.084398976982097e-06,
"loss": 0.3526,
"step": 1510
},
{
"epoch": 2.2093023255813953,
"grad_norm": 9.0557222366333,
"learning_rate": 6.956521739130435e-06,
"loss": 0.3315,
"step": 1520
},
{
"epoch": 2.2238372093023258,
"grad_norm": 9.88924789428711,
"learning_rate": 6.828644501278773e-06,
"loss": 0.342,
"step": 1530
},
{
"epoch": 2.238372093023256,
"grad_norm": 10.470682144165039,
"learning_rate": 6.70076726342711e-06,
"loss": 0.3666,
"step": 1540
},
{
"epoch": 2.2529069767441863,
"grad_norm": 10.087296485900879,
"learning_rate": 6.572890025575448e-06,
"loss": 0.3509,
"step": 1550
},
{
"epoch": 2.2674418604651163,
"grad_norm": 9.986245155334473,
"learning_rate": 6.4450127877237854e-06,
"loss": 0.2961,
"step": 1560
},
{
"epoch": 2.2819767441860463,
"grad_norm": 4.27475643157959,
"learning_rate": 6.317135549872123e-06,
"loss": 0.3514,
"step": 1570
},
{
"epoch": 2.296511627906977,
"grad_norm": 18.000774383544922,
"learning_rate": 6.189258312020461e-06,
"loss": 0.2998,
"step": 1580
},
{
"epoch": 2.311046511627907,
"grad_norm": 11.935790061950684,
"learning_rate": 6.061381074168798e-06,
"loss": 0.3849,
"step": 1590
},
{
"epoch": 2.3255813953488373,
"grad_norm": 6.844956874847412,
"learning_rate": 5.933503836317136e-06,
"loss": 0.3418,
"step": 1600
},
{
"epoch": 2.3255813953488373,
"eval_accuracy": 0.74375,
"eval_accuracy_label_arts, culture, entertainment and media": 0.7894736842105263,
"eval_accuracy_label_conflict, war and peace": 0.7350689127105666,
"eval_accuracy_label_crime, law and justice": 0.9072164948453608,
"eval_accuracy_label_disaster, accident, and emergency incident": 0.8493150684931506,
"eval_accuracy_label_economy, business, and finance": 0.7864077669902912,
"eval_accuracy_label_environment": 0.4482758620689655,
"eval_accuracy_label_health": 0.7777777777777778,
"eval_accuracy_label_human interest": 0.3181818181818182,
"eval_accuracy_label_labour": 0.5,
"eval_accuracy_label_lifestyle and leisure": 0.5555555555555556,
"eval_accuracy_label_politics": 0.7909407665505227,
"eval_accuracy_label_religion": 0.0,
"eval_accuracy_label_science and technology": 0.4166666666666667,
"eval_accuracy_label_society": 0.18461538461538463,
"eval_accuracy_label_sport": 0.9615384615384616,
"eval_accuracy_label_weather": 0.0,
"eval_f1": 0.7440049917955611,
"eval_loss": 0.804217517375946,
"eval_precision": 0.768551401471047,
"eval_recall": 0.74375,
"eval_runtime": 12.6056,
"eval_samples_per_second": 126.928,
"eval_steps_per_second": 7.933,
"step": 1600
},
{
"epoch": 2.3401162790697674,
"grad_norm": 14.338434219360352,
"learning_rate": 5.8056265984654735e-06,
"loss": 0.2883,
"step": 1610
},
{
"epoch": 2.354651162790698,
"grad_norm": 5.656998634338379,
"learning_rate": 5.677749360613811e-06,
"loss": 0.2737,
"step": 1620
},
{
"epoch": 2.369186046511628,
"grad_norm": 6.466466903686523,
"learning_rate": 5.549872122762149e-06,
"loss": 0.331,
"step": 1630
},
{
"epoch": 2.383720930232558,
"grad_norm": 11.816296577453613,
"learning_rate": 5.421994884910486e-06,
"loss": 0.3733,
"step": 1640
},
{
"epoch": 2.3982558139534884,
"grad_norm": 8.958051681518555,
"learning_rate": 5.294117647058824e-06,
"loss": 0.2802,
"step": 1650
},
{
"epoch": 2.4127906976744184,
"grad_norm": 13.985147476196289,
"learning_rate": 5.1662404092071615e-06,
"loss": 0.353,
"step": 1660
},
{
"epoch": 2.427325581395349,
"grad_norm": 17.26644515991211,
"learning_rate": 5.038363171355499e-06,
"loss": 0.3399,
"step": 1670
},
{
"epoch": 2.441860465116279,
"grad_norm": 13.139063835144043,
"learning_rate": 4.910485933503837e-06,
"loss": 0.2949,
"step": 1680
},
{
"epoch": 2.4563953488372094,
"grad_norm": 15.950389862060547,
"learning_rate": 4.782608695652174e-06,
"loss": 0.3742,
"step": 1690
},
{
"epoch": 2.4709302325581395,
"grad_norm": 8.10091495513916,
"learning_rate": 4.654731457800512e-06,
"loss": 0.2605,
"step": 1700
},
{
"epoch": 2.4854651162790695,
"grad_norm": 8.73356819152832,
"learning_rate": 4.5268542199488496e-06,
"loss": 0.2077,
"step": 1710
},
{
"epoch": 2.5,
"grad_norm": 7.236685276031494,
"learning_rate": 4.398976982097187e-06,
"loss": 0.3526,
"step": 1720
},
{
"epoch": 2.5145348837209305,
"grad_norm": 6.902716159820557,
"learning_rate": 4.271099744245525e-06,
"loss": 0.2633,
"step": 1730
},
{
"epoch": 2.5290697674418605,
"grad_norm": 4.061647891998291,
"learning_rate": 4.143222506393862e-06,
"loss": 0.2682,
"step": 1740
},
{
"epoch": 2.5436046511627906,
"grad_norm": 3.789299488067627,
"learning_rate": 4.0153452685422e-06,
"loss": 0.2996,
"step": 1750
},
{
"epoch": 2.558139534883721,
"grad_norm": 7.185976505279541,
"learning_rate": 3.887468030690537e-06,
"loss": 0.323,
"step": 1760
},
{
"epoch": 2.572674418604651,
"grad_norm": 9.113693237304688,
"learning_rate": 3.7595907928388748e-06,
"loss": 0.2854,
"step": 1770
},
{
"epoch": 2.5872093023255816,
"grad_norm": 10.132606506347656,
"learning_rate": 3.6317135549872124e-06,
"loss": 0.351,
"step": 1780
},
{
"epoch": 2.6017441860465116,
"grad_norm": 12.435748100280762,
"learning_rate": 3.50383631713555e-06,
"loss": 0.3271,
"step": 1790
},
{
"epoch": 2.616279069767442,
"grad_norm": 15.90312671661377,
"learning_rate": 3.3759590792838876e-06,
"loss": 0.248,
"step": 1800
},
{
"epoch": 2.616279069767442,
"eval_accuracy": 0.7275,
"eval_accuracy_label_arts, culture, entertainment and media": 0.6842105263157895,
"eval_accuracy_label_conflict, war and peace": 0.6891271056661562,
"eval_accuracy_label_crime, law and justice": 0.8814432989690721,
"eval_accuracy_label_disaster, accident, and emergency incident": 0.8698630136986302,
"eval_accuracy_label_economy, business, and finance": 0.7572815533980582,
"eval_accuracy_label_environment": 0.41379310344827586,
"eval_accuracy_label_health": 0.8333333333333334,
"eval_accuracy_label_human interest": 0.4090909090909091,
"eval_accuracy_label_labour": 0.5,
"eval_accuracy_label_lifestyle and leisure": 0.5555555555555556,
"eval_accuracy_label_politics": 0.8013937282229965,
"eval_accuracy_label_religion": 0.0,
"eval_accuracy_label_science and technology": 0.4166666666666667,
"eval_accuracy_label_society": 0.27692307692307694,
"eval_accuracy_label_sport": 0.9615384615384616,
"eval_accuracy_label_weather": 0.0,
"eval_f1": 0.7324830328014649,
"eval_loss": 0.8387188911437988,
"eval_precision": 0.7610492043473545,
"eval_recall": 0.7275,
"eval_runtime": 12.5904,
"eval_samples_per_second": 127.081,
"eval_steps_per_second": 7.943,
"step": 1800
},
{
"epoch": 2.630813953488372,
"grad_norm": 14.707446098327637,
"learning_rate": 3.248081841432225e-06,
"loss": 0.3358,
"step": 1810
},
{
"epoch": 2.645348837209302,
"grad_norm": 8.684798240661621,
"learning_rate": 3.120204603580563e-06,
"loss": 0.3082,
"step": 1820
},
{
"epoch": 2.6598837209302326,
"grad_norm": 8.125092506408691,
"learning_rate": 2.9923273657289004e-06,
"loss": 0.2818,
"step": 1830
},
{
"epoch": 2.6744186046511627,
"grad_norm": 10.351339340209961,
"learning_rate": 2.864450127877238e-06,
"loss": 0.3465,
"step": 1840
},
{
"epoch": 2.688953488372093,
"grad_norm": 9.536513328552246,
"learning_rate": 2.7365728900255756e-06,
"loss": 0.3022,
"step": 1850
},
{
"epoch": 2.703488372093023,
"grad_norm": 7.122174263000488,
"learning_rate": 2.6086956521739132e-06,
"loss": 0.3742,
"step": 1860
},
{
"epoch": 2.7180232558139537,
"grad_norm": 11.325377464294434,
"learning_rate": 2.480818414322251e-06,
"loss": 0.2912,
"step": 1870
},
{
"epoch": 2.7325581395348837,
"grad_norm": 9.651542663574219,
"learning_rate": 2.3529411764705885e-06,
"loss": 0.3156,
"step": 1880
},
{
"epoch": 2.7470930232558137,
"grad_norm": 16.223478317260742,
"learning_rate": 2.225063938618926e-06,
"loss": 0.3405,
"step": 1890
},
{
"epoch": 2.761627906976744,
"grad_norm": 6.137476921081543,
"learning_rate": 2.0971867007672637e-06,
"loss": 0.1922,
"step": 1900
},
{
"epoch": 2.7761627906976747,
"grad_norm": 9.50839614868164,
"learning_rate": 1.9693094629156013e-06,
"loss": 0.2896,
"step": 1910
},
{
"epoch": 2.7906976744186047,
"grad_norm": 8.988372802734375,
"learning_rate": 1.8414322250639389e-06,
"loss": 0.3286,
"step": 1920
},
{
"epoch": 2.8052325581395348,
"grad_norm": 9.569466590881348,
"learning_rate": 1.7135549872122765e-06,
"loss": 0.3463,
"step": 1930
},
{
"epoch": 2.8197674418604652,
"grad_norm": 7.808605194091797,
"learning_rate": 1.585677749360614e-06,
"loss": 0.3117,
"step": 1940
},
{
"epoch": 2.8343023255813953,
"grad_norm": 9.752486228942871,
"learning_rate": 1.4578005115089517e-06,
"loss": 0.3708,
"step": 1950
},
{
"epoch": 2.8488372093023253,
"grad_norm": 6.103060722351074,
"learning_rate": 1.3299232736572893e-06,
"loss": 0.2766,
"step": 1960
},
{
"epoch": 2.863372093023256,
"grad_norm": 8.869214057922363,
"learning_rate": 1.2020460358056267e-06,
"loss": 0.2762,
"step": 1970
},
{
"epoch": 2.8779069767441863,
"grad_norm": 8.96507740020752,
"learning_rate": 1.0741687979539643e-06,
"loss": 0.2874,
"step": 1980
},
{
"epoch": 2.8924418604651163,
"grad_norm": 8.362478256225586,
"learning_rate": 9.462915601023019e-07,
"loss": 0.2944,
"step": 1990
},
{
"epoch": 2.9069767441860463,
"grad_norm": 7.523708820343018,
"learning_rate": 8.184143222506395e-07,
"loss": 0.2525,
"step": 2000
},
{
"epoch": 2.9069767441860463,
"eval_accuracy": 0.735,
"eval_accuracy_label_arts, culture, entertainment and media": 0.6842105263157895,
"eval_accuracy_label_conflict, war and peace": 0.7105666156202144,
"eval_accuracy_label_crime, law and justice": 0.8762886597938144,
"eval_accuracy_label_disaster, accident, and emergency incident": 0.8698630136986302,
"eval_accuracy_label_economy, business, and finance": 0.6796116504854369,
"eval_accuracy_label_environment": 0.4482758620689655,
"eval_accuracy_label_health": 0.7222222222222222,
"eval_accuracy_label_human interest": 0.36363636363636365,
"eval_accuracy_label_labour": 0.5,
"eval_accuracy_label_lifestyle and leisure": 0.5555555555555556,
"eval_accuracy_label_politics": 0.8153310104529616,
"eval_accuracy_label_religion": 0.0,
"eval_accuracy_label_science and technology": 0.4583333333333333,
"eval_accuracy_label_society": 0.3384615384615385,
"eval_accuracy_label_sport": 0.9615384615384616,
"eval_accuracy_label_weather": 0.0,
"eval_f1": 0.7412823760546817,
"eval_loss": 0.8137220740318298,
"eval_precision": 0.7696596009813345,
"eval_recall": 0.735,
"eval_runtime": 12.5933,
"eval_samples_per_second": 127.051,
"eval_steps_per_second": 7.941,
"step": 2000
},
{
"epoch": 2.921511627906977,
"grad_norm": 9.854249954223633,
"learning_rate": 6.90537084398977e-07,
"loss": 0.2625,
"step": 2010
},
{
"epoch": 2.936046511627907,
"grad_norm": 7.306544780731201,
"learning_rate": 5.626598465473146e-07,
"loss": 0.3285,
"step": 2020
},
{
"epoch": 2.9505813953488373,
"grad_norm": 4.267274856567383,
"learning_rate": 4.347826086956522e-07,
"loss": 0.3445,
"step": 2030
},
{
"epoch": 2.9651162790697674,
"grad_norm": 15.480578422546387,
"learning_rate": 3.069053708439898e-07,
"loss": 0.3066,
"step": 2040
},
{
"epoch": 2.979651162790698,
"grad_norm": 11.125273704528809,
"learning_rate": 1.7902813299232738e-07,
"loss": 0.3026,
"step": 2050
},
{
"epoch": 2.994186046511628,
"grad_norm": 12.110825538635254,
"learning_rate": 5.115089514066497e-08,
"loss": 0.2815,
"step": 2060
},
{
"epoch": 3.0,
"step": 2064,
"total_flos": 8687308686630912.0,
"train_loss": 0.8068887479603291,
"train_runtime": 1561.1428,
"train_samples_per_second": 42.294,
"train_steps_per_second": 1.322
},
{
"epoch": 3.0,
"eval_accuracy": 0.743125,
"eval_accuracy_label_arts, culture, entertainment and media": 0.6842105263157895,
"eval_accuracy_label_conflict, war and peace": 0.7350689127105666,
"eval_accuracy_label_crime, law and justice": 0.8917525773195877,
"eval_accuracy_label_disaster, accident, and emergency incident": 0.8698630136986302,
"eval_accuracy_label_economy, business, and finance": 0.6893203883495146,
"eval_accuracy_label_environment": 0.4482758620689655,
"eval_accuracy_label_health": 0.7222222222222222,
"eval_accuracy_label_human interest": 0.3181818181818182,
"eval_accuracy_label_labour": 0.5,
"eval_accuracy_label_lifestyle and leisure": 0.5555555555555556,
"eval_accuracy_label_politics": 0.7909407665505227,
"eval_accuracy_label_religion": 0.0,
"eval_accuracy_label_science and technology": 0.4583333333333333,
"eval_accuracy_label_society": 0.35384615384615387,
"eval_accuracy_label_sport": 0.9615384615384616,
"eval_accuracy_label_weather": 0.0,
"eval_f1": 0.747448709907019,
"eval_loss": 0.8030127882957458,
"eval_precision": 0.7695117491320402,
"eval_recall": 0.743125,
"eval_runtime": 12.5023,
"eval_samples_per_second": 127.976,
"eval_steps_per_second": 7.999,
"step": 2064
}
],
"logging_steps": 10,
"max_steps": 2064,
"num_input_tokens_seen": 0,
"num_train_epochs": 3,
"save_steps": 1000,
"total_flos": 8687308686630912.0,
"train_batch_size": 16,
"trial_name": null,
"trial_params": null
}